From 755b521dd14837a237a8e592ff576b10a4b93f7e Mon Sep 17 00:00:00 2001
From: Michal Kubecek
Date: Wed, 31 May 2017 09:36:09 +0200
Subject: [PATCH 01/41] import Workstation 12.5.5 module sources

---
 vmmon-only/COPYING | 339 ++
 vmmon-only/Makefile | 150 +
 vmmon-only/Makefile.kernel | 39 +
 vmmon-only/Makefile.normal | 143 +
 vmmon-only/README | 14 +
 vmmon-only/autoconf/geninclude.c | 41 +
 vmmon-only/autoconf/smpcall.c | 37 +
 vmmon-only/autoconf/tsc_khz.c | 32 +
 vmmon-only/common/apic.c | 279 +
 vmmon-only/common/apic.h | 47 +
 vmmon-only/common/comport.c | 203 +
 vmmon-only/common/comport.h | 41 +
 vmmon-only/common/cpuid.c | 209 +
 vmmon-only/common/cpuid.h | 56 +
 vmmon-only/common/hashFunc.c | 41 +
 vmmon-only/common/hostKernel.h | 83 +
 vmmon-only/common/hostif.h | 148 +
 vmmon-only/common/hostifGlobalLock.h | 45 +
 vmmon-only/common/hostifMem.h | 37 +
 vmmon-only/common/memtrack.c | 551 ++
 vmmon-only/common/memtrack.h | 60 +
 vmmon-only/common/phystrack.c | 495 ++
 vmmon-only/common/phystrack.h | 54 +
 vmmon-only/common/task.c | 2180 ++++++++
 vmmon-only/common/task.h | 43 +
 vmmon-only/common/vmx86.c | 2920 +++++++++++
 vmmon-only/common/vmx86.h | 201 +
 vmmon-only/include/address_defs.h | 95 +
 vmmon-only/include/basic_initblock.h | 60 +
 vmmon-only/include/circList.h | 428 ++
 vmmon-only/include/community_source.h | 67 +
 vmmon-only/include/compat_autoconf.h | 41 +
 vmmon-only/include/compat_cred.h | 47 +
 vmmon-only/include/compat_highmem.h | 32 +
 vmmon-only/include/compat_interrupt.h | 55 +
 vmmon-only/include/compat_ioport.h | 63 +
 vmmon-only/include/compat_kernel.h | 42 +
 vmmon-only/include/compat_module.h | 83 +
 vmmon-only/include/compat_page.h | 75 +
 vmmon-only/include/compat_pci.h | 72 +
 vmmon-only/include/compat_pgtable.h | 139 +
 vmmon-only/include/compat_sched.h | 293 ++
 vmmon-only/include/compat_semaphore.h | 49 +
 vmmon-only/include/compat_spinlock.h | 48 +
 vmmon-only/include/compat_version.h | 131 +
 vmmon-only/include/contextinfo.h | 78 +
 vmmon-only/include/cpu_defs.h | 49 +
 vmmon-only/include/cpuid_info.h | 95 +
 vmmon-only/include/crossgdt.h | 79 +
 vmmon-only/include/driver-config.h | 79 +
 vmmon-only/include/hashFunc.h | 345 ++
 vmmon-only/include/includeCheck.h | 17 +
 vmmon-only/include/initblock.h | 43 +
 vmmon-only/include/iocontrols.h | 623 +++
 vmmon-only/include/memDefaults.h | 154 +
 vmmon-only/include/modulecall.h | 495 ++
 vmmon-only/include/modulecallstructs.h | 99 +
 vmmon-only/include/mon_assert.h | 207 +
 vmmon-only/include/monitorAction_exported.h | 156 +
 vmmon-only/include/numa_defs.h | 72 +
 vmmon-only/include/overheadmem_types.h | 131 +
 vmmon-only/include/pageLock_defs.h | 105 +
 vmmon-only/include/pagelist.h | 101 +
 vmmon-only/include/pcip_defs.h | 122 +
 vmmon-only/include/perfctr_generic.h | 72 +
 vmmon-only/include/pgtbl.h | 382 ++
 vmmon-only/include/pshare_ext.h | 64 +
 vmmon-only/include/ptsc.h | 263 +
 vmmon-only/include/rateconv.h | 118 +
 vmmon-only/include/uccostTable.h | 34 +
 vmmon-only/include/usercalldefs.h | 35 +
 vmmon-only/include/vcpuid.h | 65 +
 vmmon-only/include/vcpuset.h | 808 +++
 vmmon-only/include/vcpuset_types.h | 58 +
 vmmon-only/include/versioned_atomic.h | 170 +
 vmmon-only/include/vm_asm.h | 93 +
 vmmon-only/include/vm_asm_x86.h | 998 ++++
 vmmon-only/include/vm_asm_x86_64.h | 136 +
 vmmon-only/include/vm_assert.h | 336 ++
 vmmon-only/include/vm_atomic.h | 3896 ++++++++++++++
 vmmon-only/include/vm_basic_asm.h | 1258 +++++
 vmmon-only/include/vm_basic_asm_x86.h | 548 ++
 vmmon-only/include/vm_basic_asm_x86_64.h | 615 +++
 vmmon-only/include/vm_basic_asm_x86_common.h | 313 ++
 vmmon-only/include/vm_basic_defs.h | 786 +++
 vmmon-only/include/vm_basic_math.h | 166 +
 vmmon-only/include/vm_basic_types.h | 1158 ++++
 vmmon-only/include/vm_time.h | 55 +
 vmmon-only/include/vmm_constants.h | 48 +
 vmmon-only/include/vmmem_shared.h | 108 +
 vmmon-only/include/vmware.h | 57 +
 vmmon-only/include/vmware_pack_begin.h | 43 +
 vmmon-only/include/vmware_pack_end.h | 44 +
 vmmon-only/include/vmware_pack_init.h | 65 +
 vmmon-only/include/x86_basic_defs.h | 242 +
 vmmon-only/include/x86apic.h | 353 ++
 vmmon-only/include/x86cpuid.h | 1783 +++++++
 vmmon-only/include/x86cpuid_asm.h | 445 ++
 vmmon-only/include/x86desc.h | 601 +++
 vmmon-only/include/x86msr.h | 505 ++
 vmmon-only/include/x86perfctr.h | 976 ++++
 vmmon-only/include/x86segdescrs.h | 101 +
 vmmon-only/include/x86sel.h | 67 +
 vmmon-only/include/x86svm.h | 496 ++
 vmmon-only/include/x86types.h | 479 ++
 vmmon-only/include/x86vendor.h | 37 +
 vmmon-only/include/x86vt-vmcs-fields.h | 213 +
 vmmon-only/include/x86vt.h | 1047 ++++
 vmmon-only/include/x86vtinstr.h | 623 +++
 vmmon-only/linux/driver.c | 2103 ++++++++
 vmmon-only/linux/driver.h | 118 +
 vmmon-only/linux/driverLog.c | 207 +
 vmmon-only/linux/driverLog.h | 37 +
 vmmon-only/linux/hostif.c | 3603 +++++++++++++
 vmmon-only/linux/hostif_priv.h | 50 +
 vmmon-only/linux/vmhost.h | 100 +
 vmmon-only/linux/vmmonInt.h | 109 +
 vmmon-only/vmcore/driver_vmcore.h | 34 +
 vmmon-only/vmcore/moduleloop.c | 265 +
 vmnet-only/COPYING | 339 ++
 vmnet-only/Makefile | 150 +
 vmnet-only/Makefile.kernel | 40 +
 vmnet-only/Makefile.normal | 77 +
 vmnet-only/bridge.c | 1761 +++++++
 vmnet-only/community_source.h | 67 +
 vmnet-only/compat_autoconf.h | 41 +
 vmnet-only/compat_module.h | 83 +
 vmnet-only/compat_netdevice.h | 346 ++
 vmnet-only/compat_skbuff.h | 170 +
 vmnet-only/compat_sock.h | 77 +
 vmnet-only/compat_version.h | 131 +
 vmnet-only/driver-config.h | 79 +
 vmnet-only/driver.c | 1707 ++++++
 vmnet-only/geninclude.c | 41 +
 vmnet-only/hub.c | 733 +++
 vmnet-only/includeCheck.h | 17 +
 vmnet-only/monitorAction_exported.h | 156 +
 vmnet-only/net.h | 209 +
 vmnet-only/netdev_has_dev_net.c | 37 +
 vmnet-only/netdev_has_net.c | 43 +
 vmnet-only/netif.c | 598 +++
 vmnet-only/nfhook_uses_skb.c | 45 +
 vmnet-only/procfs.c | 407 ++
 vmnet-only/skblin.c | 41 +
 vmnet-only/smac.c | 4951 ++++++++++++++++++
 vmnet-only/smac.h | 119 +
 vmnet-only/smac_compat.c | 427 ++
 vmnet-only/smac_compat.h | 60 +
 vmnet-only/userif.c | 1161 ++++
 vmnet-only/vm_assert.h | 336 ++
 vmnet-only/vm_atomic.h | 3896 ++++++++++++++
 vmnet-only/vm_basic_asm.h | 1258 +++++
 vmnet-only/vm_basic_asm_x86.h | 548 ++
 vmnet-only/vm_basic_asm_x86_64.h | 615 +++
 vmnet-only/vm_basic_asm_x86_common.h | 313 ++
 vmnet-only/vm_basic_defs.h | 786 +++
 vmnet-only/vm_basic_types.h | 1158 ++++
 vmnet-only/vm_device_version.h | 309 ++
 vmnet-only/vm_oui.h | 207 +
 vmnet-only/vmnetInt.h | 100 +
 vmnet-only/vmware_pack_begin.h | 43 +
 vmnet-only/vmware_pack_end.h | 44 +
 vmnet-only/vmware_pack_init.h | 65 +
 vmnet-only/vnet.h | 450 ++
 vmnet-only/vnetEvent.c | 557 ++
 vmnet-only/vnetEvent.h | 50 +
 vmnet-only/vnetFilter.h | 191 +
 vmnet-only/vnetFilterInt.h | 0
 vmnet-only/vnetInt.h | 365 ++
 vmnet-only/vnetKernel.h | 83 +
 vmnet-only/vnetUserListener.c | 336 ++
 vmnet-only/x86cpuid.h | 1815 +++++++
 172 files changed, 68382 insertions(+)
 create mode 100644 vmmon-only/COPYING
 create mode 100644 vmmon-only/Makefile
 create mode 100644 vmmon-only/Makefile.kernel
 create mode 100644 vmmon-only/Makefile.normal
 create mode 100644 vmmon-only/README
 create mode 100644 vmmon-only/autoconf/geninclude.c
 create mode 100644
vmmon-only/autoconf/smpcall.c create mode 100644 vmmon-only/autoconf/tsc_khz.c create mode 100644 vmmon-only/common/apic.c create mode 100644 vmmon-only/common/apic.h create mode 100644 vmmon-only/common/comport.c create mode 100644 vmmon-only/common/comport.h create mode 100644 vmmon-only/common/cpuid.c create mode 100644 vmmon-only/common/cpuid.h create mode 100644 vmmon-only/common/hashFunc.c create mode 100644 vmmon-only/common/hostKernel.h create mode 100644 vmmon-only/common/hostif.h create mode 100644 vmmon-only/common/hostifGlobalLock.h create mode 100644 vmmon-only/common/hostifMem.h create mode 100644 vmmon-only/common/memtrack.c create mode 100644 vmmon-only/common/memtrack.h create mode 100644 vmmon-only/common/phystrack.c create mode 100644 vmmon-only/common/phystrack.h create mode 100644 vmmon-only/common/task.c create mode 100644 vmmon-only/common/task.h create mode 100644 vmmon-only/common/vmx86.c create mode 100644 vmmon-only/common/vmx86.h create mode 100644 vmmon-only/include/address_defs.h create mode 100644 vmmon-only/include/basic_initblock.h create mode 100644 vmmon-only/include/circList.h create mode 100644 vmmon-only/include/community_source.h create mode 100644 vmmon-only/include/compat_autoconf.h create mode 100644 vmmon-only/include/compat_cred.h create mode 100644 vmmon-only/include/compat_highmem.h create mode 100644 vmmon-only/include/compat_interrupt.h create mode 100644 vmmon-only/include/compat_ioport.h create mode 100644 vmmon-only/include/compat_kernel.h create mode 100644 vmmon-only/include/compat_module.h create mode 100644 vmmon-only/include/compat_page.h create mode 100644 vmmon-only/include/compat_pci.h create mode 100644 vmmon-only/include/compat_pgtable.h create mode 100644 vmmon-only/include/compat_sched.h create mode 100644 vmmon-only/include/compat_semaphore.h create mode 100644 vmmon-only/include/compat_spinlock.h create mode 100644 vmmon-only/include/compat_version.h create mode 100644 vmmon-only/include/contextinfo.h create mode 100644 vmmon-only/include/cpu_defs.h create mode 100644 vmmon-only/include/cpuid_info.h create mode 100644 vmmon-only/include/crossgdt.h create mode 100644 vmmon-only/include/driver-config.h create mode 100644 vmmon-only/include/hashFunc.h create mode 100644 vmmon-only/include/includeCheck.h create mode 100644 vmmon-only/include/initblock.h create mode 100644 vmmon-only/include/iocontrols.h create mode 100644 vmmon-only/include/memDefaults.h create mode 100644 vmmon-only/include/modulecall.h create mode 100644 vmmon-only/include/modulecallstructs.h create mode 100644 vmmon-only/include/mon_assert.h create mode 100644 vmmon-only/include/monitorAction_exported.h create mode 100644 vmmon-only/include/numa_defs.h create mode 100644 vmmon-only/include/overheadmem_types.h create mode 100644 vmmon-only/include/pageLock_defs.h create mode 100644 vmmon-only/include/pagelist.h create mode 100644 vmmon-only/include/pcip_defs.h create mode 100644 vmmon-only/include/perfctr_generic.h create mode 100644 vmmon-only/include/pgtbl.h create mode 100644 vmmon-only/include/pshare_ext.h create mode 100644 vmmon-only/include/ptsc.h create mode 100644 vmmon-only/include/rateconv.h create mode 100644 vmmon-only/include/uccostTable.h create mode 100644 vmmon-only/include/usercalldefs.h create mode 100644 vmmon-only/include/vcpuid.h create mode 100644 vmmon-only/include/vcpuset.h create mode 100644 vmmon-only/include/vcpuset_types.h create mode 100644 vmmon-only/include/versioned_atomic.h create mode 100644 vmmon-only/include/vm_asm.h create 
mode 100644 vmmon-only/include/vm_asm_x86.h create mode 100644 vmmon-only/include/vm_asm_x86_64.h create mode 100644 vmmon-only/include/vm_assert.h create mode 100644 vmmon-only/include/vm_atomic.h create mode 100644 vmmon-only/include/vm_basic_asm.h create mode 100644 vmmon-only/include/vm_basic_asm_x86.h create mode 100644 vmmon-only/include/vm_basic_asm_x86_64.h create mode 100644 vmmon-only/include/vm_basic_asm_x86_common.h create mode 100644 vmmon-only/include/vm_basic_defs.h create mode 100644 vmmon-only/include/vm_basic_math.h create mode 100644 vmmon-only/include/vm_basic_types.h create mode 100644 vmmon-only/include/vm_time.h create mode 100644 vmmon-only/include/vmm_constants.h create mode 100644 vmmon-only/include/vmmem_shared.h create mode 100644 vmmon-only/include/vmware.h create mode 100644 vmmon-only/include/vmware_pack_begin.h create mode 100644 vmmon-only/include/vmware_pack_end.h create mode 100644 vmmon-only/include/vmware_pack_init.h create mode 100644 vmmon-only/include/x86_basic_defs.h create mode 100644 vmmon-only/include/x86apic.h create mode 100644 vmmon-only/include/x86cpuid.h create mode 100644 vmmon-only/include/x86cpuid_asm.h create mode 100644 vmmon-only/include/x86desc.h create mode 100644 vmmon-only/include/x86msr.h create mode 100644 vmmon-only/include/x86perfctr.h create mode 100644 vmmon-only/include/x86segdescrs.h create mode 100644 vmmon-only/include/x86sel.h create mode 100644 vmmon-only/include/x86svm.h create mode 100644 vmmon-only/include/x86types.h create mode 100644 vmmon-only/include/x86vendor.h create mode 100644 vmmon-only/include/x86vt-vmcs-fields.h create mode 100644 vmmon-only/include/x86vt.h create mode 100644 vmmon-only/include/x86vtinstr.h create mode 100644 vmmon-only/linux/driver.c create mode 100644 vmmon-only/linux/driver.h create mode 100644 vmmon-only/linux/driverLog.c create mode 100644 vmmon-only/linux/driverLog.h create mode 100644 vmmon-only/linux/hostif.c create mode 100644 vmmon-only/linux/hostif_priv.h create mode 100644 vmmon-only/linux/vmhost.h create mode 100644 vmmon-only/linux/vmmonInt.h create mode 100644 vmmon-only/vmcore/driver_vmcore.h create mode 100644 vmmon-only/vmcore/moduleloop.c create mode 100644 vmnet-only/COPYING create mode 100644 vmnet-only/Makefile create mode 100644 vmnet-only/Makefile.kernel create mode 100644 vmnet-only/Makefile.normal create mode 100644 vmnet-only/bridge.c create mode 100644 vmnet-only/community_source.h create mode 100644 vmnet-only/compat_autoconf.h create mode 100644 vmnet-only/compat_module.h create mode 100644 vmnet-only/compat_netdevice.h create mode 100644 vmnet-only/compat_skbuff.h create mode 100644 vmnet-only/compat_sock.h create mode 100644 vmnet-only/compat_version.h create mode 100644 vmnet-only/driver-config.h create mode 100644 vmnet-only/driver.c create mode 100644 vmnet-only/geninclude.c create mode 100644 vmnet-only/hub.c create mode 100644 vmnet-only/includeCheck.h create mode 100644 vmnet-only/monitorAction_exported.h create mode 100644 vmnet-only/net.h create mode 100644 vmnet-only/netdev_has_dev_net.c create mode 100644 vmnet-only/netdev_has_net.c create mode 100644 vmnet-only/netif.c create mode 100644 vmnet-only/nfhook_uses_skb.c create mode 100644 vmnet-only/procfs.c create mode 100644 vmnet-only/skblin.c create mode 100644 vmnet-only/smac.c create mode 100644 vmnet-only/smac.h create mode 100644 vmnet-only/smac_compat.c create mode 100644 vmnet-only/smac_compat.h create mode 100644 vmnet-only/userif.c create mode 100644 vmnet-only/vm_assert.h create mode 
100644 vmnet-only/vm_atomic.h create mode 100644 vmnet-only/vm_basic_asm.h create mode 100644 vmnet-only/vm_basic_asm_x86.h create mode 100644 vmnet-only/vm_basic_asm_x86_64.h create mode 100644 vmnet-only/vm_basic_asm_x86_common.h create mode 100644 vmnet-only/vm_basic_defs.h create mode 100644 vmnet-only/vm_basic_types.h create mode 100644 vmnet-only/vm_device_version.h create mode 100644 vmnet-only/vm_oui.h create mode 100644 vmnet-only/vmnetInt.h create mode 100644 vmnet-only/vmware_pack_begin.h create mode 100644 vmnet-only/vmware_pack_end.h create mode 100644 vmnet-only/vmware_pack_init.h create mode 100644 vmnet-only/vnet.h create mode 100644 vmnet-only/vnetEvent.c create mode 100644 vmnet-only/vnetEvent.h create mode 100644 vmnet-only/vnetFilter.h create mode 100644 vmnet-only/vnetFilterInt.h create mode 100644 vmnet-only/vnetInt.h create mode 100644 vmnet-only/vnetKernel.h create mode 100644 vmnet-only/vnetUserListener.c create mode 100644 vmnet-only/x86cpuid.h diff --git a/vmmon-only/COPYING b/vmmon-only/COPYING new file mode 100644 index 00000000..d511905c --- /dev/null +++ b/vmmon-only/COPYING @@ -0,0 +1,339 @@ + GNU GENERAL PUBLIC LICENSE + Version 2, June 1991 + + Copyright (C) 1989, 1991 Free Software Foundation, Inc., + 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA + Everyone is permitted to copy and distribute verbatim copies + of this license document, but changing it is not allowed. + + Preamble + + The licenses for most software are designed to take away your +freedom to share and change it. By contrast, the GNU General Public +License is intended to guarantee your freedom to share and change free +software--to make sure the software is free for all its users. This +General Public License applies to most of the Free Software +Foundation's software and to any other program whose authors commit to +using it. (Some other Free Software Foundation software is covered by +the GNU Lesser General Public License instead.) You can apply it to +your programs, too. + + When we speak of free software, we are referring to freedom, not +price. Our General Public Licenses are designed to make sure that you +have the freedom to distribute copies of free software (and charge for +this service if you wish), that you receive source code or can get it +if you want it, that you can change the software or use pieces of it +in new free programs; and that you know you can do these things. + + To protect your rights, we need to make restrictions that forbid +anyone to deny you these rights or to ask you to surrender the rights. +These restrictions translate to certain responsibilities for you if you +distribute copies of the software, or if you modify it. + + For example, if you distribute copies of such a program, whether +gratis or for a fee, you must give the recipients all the rights that +you have. You must make sure that they, too, receive or can get the +source code. And you must show them these terms so they know their +rights. + + We protect your rights with two steps: (1) copyright the software, and +(2) offer you this license which gives you legal permission to copy, +distribute and/or modify the software. + + Also, for each author's protection and ours, we want to make certain +that everyone understands that there is no warranty for this free +software. 
If the software is modified by someone else and passed on, we +want its recipients to know that what they have is not the original, so +that any problems introduced by others will not reflect on the original +authors' reputations. + + Finally, any free program is threatened constantly by software +patents. We wish to avoid the danger that redistributors of a free +program will individually obtain patent licenses, in effect making the +program proprietary. To prevent this, we have made it clear that any +patent must be licensed for everyone's free use or not licensed at all. + + The precise terms and conditions for copying, distribution and +modification follow. + + GNU GENERAL PUBLIC LICENSE + TERMS AND CONDITIONS FOR COPYING, DISTRIBUTION AND MODIFICATION + + 0. This License applies to any program or other work which contains +a notice placed by the copyright holder saying it may be distributed +under the terms of this General Public License. The "Program", below, +refers to any such program or work, and a "work based on the Program" +means either the Program or any derivative work under copyright law: +that is to say, a work containing the Program or a portion of it, +either verbatim or with modifications and/or translated into another +language. (Hereinafter, translation is included without limitation in +the term "modification".) Each licensee is addressed as "you". + +Activities other than copying, distribution and modification are not +covered by this License; they are outside its scope. The act of +running the Program is not restricted, and the output from the Program +is covered only if its contents constitute a work based on the +Program (independent of having been made by running the Program). +Whether that is true depends on what the Program does. + + 1. You may copy and distribute verbatim copies of the Program's +source code as you receive it, in any medium, provided that you +conspicuously and appropriately publish on each copy an appropriate +copyright notice and disclaimer of warranty; keep intact all the +notices that refer to this License and to the absence of any warranty; +and give any other recipients of the Program a copy of this License +along with the Program. + +You may charge a fee for the physical act of transferring a copy, and +you may at your option offer warranty protection in exchange for a fee. + + 2. You may modify your copy or copies of the Program or any portion +of it, thus forming a work based on the Program, and copy and +distribute such modifications or work under the terms of Section 1 +above, provided that you also meet all of these conditions: + + a) You must cause the modified files to carry prominent notices + stating that you changed the files and the date of any change. + + b) You must cause any work that you distribute or publish, that in + whole or in part contains or is derived from the Program or any + part thereof, to be licensed as a whole at no charge to all third + parties under the terms of this License. + + c) If the modified program normally reads commands interactively + when run, you must cause it, when started running for such + interactive use in the most ordinary way, to print or display an + announcement including an appropriate copyright notice and a + notice that there is no warranty (or else, saying that you provide + a warranty) and that users may redistribute the program under + these conditions, and telling the user how to view a copy of this + License. 
(Exception: if the Program itself is interactive but + does not normally print such an announcement, your work based on + the Program is not required to print an announcement.) + +These requirements apply to the modified work as a whole. If +identifiable sections of that work are not derived from the Program, +and can be reasonably considered independent and separate works in +themselves, then this License, and its terms, do not apply to those +sections when you distribute them as separate works. But when you +distribute the same sections as part of a whole which is a work based +on the Program, the distribution of the whole must be on the terms of +this License, whose permissions for other licensees extend to the +entire whole, and thus to each and every part regardless of who wrote it. + +Thus, it is not the intent of this section to claim rights or contest +your rights to work written entirely by you; rather, the intent is to +exercise the right to control the distribution of derivative or +collective works based on the Program. + +In addition, mere aggregation of another work not based on the Program +with the Program (or with a work based on the Program) on a volume of +a storage or distribution medium does not bring the other work under +the scope of this License. + + 3. You may copy and distribute the Program (or a work based on it, +under Section 2) in object code or executable form under the terms of +Sections 1 and 2 above provided that you also do one of the following: + + a) Accompany it with the complete corresponding machine-readable + source code, which must be distributed under the terms of Sections + 1 and 2 above on a medium customarily used for software interchange; or, + + b) Accompany it with a written offer, valid for at least three + years, to give any third party, for a charge no more than your + cost of physically performing source distribution, a complete + machine-readable copy of the corresponding source code, to be + distributed under the terms of Sections 1 and 2 above on a medium + customarily used for software interchange; or, + + c) Accompany it with the information you received as to the offer + to distribute corresponding source code. (This alternative is + allowed only for noncommercial distribution and only if you + received the program in object code or executable form with such + an offer, in accord with Subsection b above.) + +The source code for a work means the preferred form of the work for +making modifications to it. For an executable work, complete source +code means all the source code for all modules it contains, plus any +associated interface definition files, plus the scripts used to +control compilation and installation of the executable. However, as a +special exception, the source code distributed need not include +anything that is normally distributed (in either source or binary +form) with the major components (compiler, kernel, and so on) of the +operating system on which the executable runs, unless that component +itself accompanies the executable. + +If distribution of executable or object code is made by offering +access to copy from a designated place, then offering equivalent +access to copy the source code from the same place counts as +distribution of the source code, even though third parties are not +compelled to copy the source along with the object code. + + 4. You may not copy, modify, sublicense, or distribute the Program +except as expressly provided under this License. 
Any attempt +otherwise to copy, modify, sublicense or distribute the Program is +void, and will automatically terminate your rights under this License. +However, parties who have received copies, or rights, from you under +this License will not have their licenses terminated so long as such +parties remain in full compliance. + + 5. You are not required to accept this License, since you have not +signed it. However, nothing else grants you permission to modify or +distribute the Program or its derivative works. These actions are +prohibited by law if you do not accept this License. Therefore, by +modifying or distributing the Program (or any work based on the +Program), you indicate your acceptance of this License to do so, and +all its terms and conditions for copying, distributing or modifying +the Program or works based on it. + + 6. Each time you redistribute the Program (or any work based on the +Program), the recipient automatically receives a license from the +original licensor to copy, distribute or modify the Program subject to +these terms and conditions. You may not impose any further +restrictions on the recipients' exercise of the rights granted herein. +You are not responsible for enforcing compliance by third parties to +this License. + + 7. If, as a consequence of a court judgment or allegation of patent +infringement or for any other reason (not limited to patent issues), +conditions are imposed on you (whether by court order, agreement or +otherwise) that contradict the conditions of this License, they do not +excuse you from the conditions of this License. If you cannot +distribute so as to satisfy simultaneously your obligations under this +License and any other pertinent obligations, then as a consequence you +may not distribute the Program at all. For example, if a patent +license would not permit royalty-free redistribution of the Program by +all those who receive copies directly or indirectly through you, then +the only way you could satisfy both it and this License would be to +refrain entirely from distribution of the Program. + +If any portion of this section is held invalid or unenforceable under +any particular circumstance, the balance of the section is intended to +apply and the section as a whole is intended to apply in other +circumstances. + +It is not the purpose of this section to induce you to infringe any +patents or other property right claims or to contest validity of any +such claims; this section has the sole purpose of protecting the +integrity of the free software distribution system, which is +implemented by public license practices. Many people have made +generous contributions to the wide range of software distributed +through that system in reliance on consistent application of that +system; it is up to the author/donor to decide if he or she is willing +to distribute software through any other system and a licensee cannot +impose that choice. + +This section is intended to make thoroughly clear what is believed to +be a consequence of the rest of this License. + + 8. If the distribution and/or use of the Program is restricted in +certain countries either by patents or by copyrighted interfaces, the +original copyright holder who places the Program under this License +may add an explicit geographical distribution limitation excluding +those countries, so that distribution is permitted only in or among +countries not thus excluded. In such case, this License incorporates +the limitation as if written in the body of this License. + + 9. 
The Free Software Foundation may publish revised and/or new versions +of the General Public License from time to time. Such new versions will +be similar in spirit to the present version, but may differ in detail to +address new problems or concerns. + +Each version is given a distinguishing version number. If the Program +specifies a version number of this License which applies to it and "any +later version", you have the option of following the terms and conditions +either of that version or of any later version published by the Free +Software Foundation. If the Program does not specify a version number of +this License, you may choose any version ever published by the Free Software +Foundation. + + 10. If you wish to incorporate parts of the Program into other free +programs whose distribution conditions are different, write to the author +to ask for permission. For software which is copyrighted by the Free +Software Foundation, write to the Free Software Foundation; we sometimes +make exceptions for this. Our decision will be guided by the two goals +of preserving the free status of all derivatives of our free software and +of promoting the sharing and reuse of software generally. + + NO WARRANTY + + 11. BECAUSE THE PROGRAM IS LICENSED FREE OF CHARGE, THERE IS NO WARRANTY +FOR THE PROGRAM, TO THE EXTENT PERMITTED BY APPLICABLE LAW. EXCEPT WHEN +OTHERWISE STATED IN WRITING THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES +PROVIDE THE PROGRAM "AS IS" WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED +OR IMPLIED, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF +MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE. THE ENTIRE RISK AS +TO THE QUALITY AND PERFORMANCE OF THE PROGRAM IS WITH YOU. SHOULD THE +PROGRAM PROVE DEFECTIVE, YOU ASSUME THE COST OF ALL NECESSARY SERVICING, +REPAIR OR CORRECTION. + + 12. IN NO EVENT UNLESS REQUIRED BY APPLICABLE LAW OR AGREED TO IN WRITING +WILL ANY COPYRIGHT HOLDER, OR ANY OTHER PARTY WHO MAY MODIFY AND/OR +REDISTRIBUTE THE PROGRAM AS PERMITTED ABOVE, BE LIABLE TO YOU FOR DAMAGES, +INCLUDING ANY GENERAL, SPECIAL, INCIDENTAL OR CONSEQUENTIAL DAMAGES ARISING +OUT OF THE USE OR INABILITY TO USE THE PROGRAM (INCLUDING BUT NOT LIMITED +TO LOSS OF DATA OR DATA BEING RENDERED INACCURATE OR LOSSES SUSTAINED BY +YOU OR THIRD PARTIES OR A FAILURE OF THE PROGRAM TO OPERATE WITH ANY OTHER +PROGRAMS), EVEN IF SUCH HOLDER OR OTHER PARTY HAS BEEN ADVISED OF THE +POSSIBILITY OF SUCH DAMAGES. + + END OF TERMS AND CONDITIONS + + How to Apply These Terms to Your New Programs + + If you develop a new program, and you want it to be of the greatest +possible use to the public, the best way to achieve this is to make it +free software which everyone can redistribute and change under these terms. + + To do so, attach the following notices to the program. It is safest +to attach them to the start of each source file to most effectively +convey the exclusion of warranty; and each file should have at least +the "copyright" line and a pointer to where the full notice is found. + + + Copyright (C) + + This program is free software; you can redistribute it and/or modify + it under the terms of the GNU General Public License as published by + the Free Software Foundation; either version 2 of the License, or + (at your option) any later version. + + This program is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + GNU General Public License for more details. 
+ + You should have received a copy of the GNU General Public License along + with this program; if not, write to the Free Software Foundation, Inc., + 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. + +Also add information on how to contact you by electronic and paper mail. + +If the program is interactive, make it output a short notice like this +when it starts in an interactive mode: + + Gnomovision version 69, Copyright (C) year name of author + Gnomovision comes with ABSOLUTELY NO WARRANTY; for details type `show w'. + This is free software, and you are welcome to redistribute it + under certain conditions; type `show c' for details. + +The hypothetical commands `show w' and `show c' should show the appropriate +parts of the General Public License. Of course, the commands you use may +be called something other than `show w' and `show c'; they could even be +mouse-clicks or menu items--whatever suits your program. + +You should also get your employer (if you work as a programmer) or your +school, if any, to sign a "copyright disclaimer" for the program, if +necessary. Here is a sample; alter the names: + + Yoyodyne, Inc., hereby disclaims all copyright interest in the program + `Gnomovision' (which makes passes at compilers) written by James Hacker. + + , 1 April 1989 + Ty Coon, President of Vice + +This General Public License does not permit incorporating your program into +proprietary programs. If your program is a subroutine library, you may +consider it more useful to permit linking proprietary applications with the +library. If this is what you want to do, use the GNU Lesser General +Public License instead of this License. diff --git a/vmmon-only/Makefile b/vmmon-only/Makefile new file mode 100644 index 00000000..de8162e8 --- /dev/null +++ b/vmmon-only/Makefile @@ -0,0 +1,150 @@ +#!/usr/bin/make -f +########################################################## +# Copyright (C) 1998-2015 VMware, Inc. All rights reserved. +# +# This program is free software; you can redistribute it and/or modify it +# under the terms of the GNU General Public License as published by the +# Free Software Foundation version 2 and no later version. +# +# This program is distributed in the hope that it will be useful, but +# WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY +# or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License +# for more details. +# +# You should have received a copy of the GNU General Public License along +# with this program; if not, write to the Free Software Foundation, Inc., +# 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA +# +########################################################## + +#### +#### VMware kernel module Makefile to be distributed externally +#### + +#### +#### SRCROOT _must_ be a relative path. +#### +SRCROOT = . + +# +# open-vm-tools doesn't replicate shared source files for different modules; +# instead, files are kept in shared locations. So define a few useful macros +# to be able to handle both cases cleanly. 
+# +INCLUDE := +ifdef OVT_SOURCE_DIR +AUTOCONF_DIR := $(OVT_SOURCE_DIR)/modules/linux/shared/autoconf +VMLIB_PATH = $(OVT_SOURCE_DIR)/lib/$(1) +INCLUDE += -I$(OVT_SOURCE_DIR)/modules/linux/shared +INCLUDE += -I$(OVT_SOURCE_DIR)/lib/include +else +AUTOCONF_DIR := $(SRCROOT)/shared/autoconf +INCLUDE += -I$(SRCROOT)/shared +endif + + +VM_UNAME = $(shell uname -r) + +# Header directory for the running kernel +ifdef LINUXINCLUDE +HEADER_DIR = $(LINUXINCLUDE) +else +HEADER_DIR = /lib/modules/$(VM_UNAME)/build/include +endif + +BUILD_DIR = $(HEADER_DIR)/.. + +DRIVER := vmmon +PRODUCT := @@PRODUCT@@ + +# Grep program +GREP = /bin/grep + +vm_check_gcc = $(shell if $(CC) $(1) -S -o /dev/null -xc /dev/null \ + > /dev/null 2>&1; then echo "$(1)"; else echo "$(2)"; fi) +vm_check_file = $(shell if test -f $(1); then echo "yes"; else echo "no"; fi) + +ifndef VM_KBUILD +VM_KBUILD := no +ifeq ($(call vm_check_file,$(BUILD_DIR)/Makefile), yes) +VM_KBUILD := yes +endif +export VM_KBUILD +endif + +ifndef VM_KBUILD_SHOWN +ifeq ($(VM_KBUILD), no) +VM_DUMMY := $(shell echo >&2 "Using standalone build system.") +else +VM_DUMMY := $(shell echo >&2 "Using kernel build system.") +endif +VM_KBUILD_SHOWN := yes +export VM_KBUILD_SHOWN +endif + +ifneq ($(VM_KBUILD), no) + +VMCCVER := $(shell $(CC) -dumpversion) + +# If there is no version defined, we are in toplevel pass, not yet in kernel makefiles... +ifeq ($(VERSION),) + +DRIVER_KO := $(DRIVER).ko + +.PHONY: $(DRIVER_KO) + +auto-build: $(DRIVER_KO) + cp -f $< $(SRCROOT)/../$(DRIVER).o + +# $(DRIVER_KO) is a phony target, so compare file times explicitly +$(DRIVER): $(DRIVER_KO) + if [ $< -nt $@ ] || [ ! -e $@ ] ; then cp -f $< $@; fi + +# Pass gcc version down the chain, so we can detect if kernel attempts to use unapproved compiler +VM_CCVER := $(VMCCVER) +export VM_CCVER +VM_CC := $(CC) +export VM_CC + +MAKEOVERRIDES := $(filter-out CC=%,$(MAKEOVERRIDES)) + +# +# Define a setup target that gets built before the actual driver. +# This target may not be used at all, but if it is then it will be defined +# in Makefile.kernel +# +prebuild:: ; +postbuild:: ; + +$(DRIVER_KO): prebuild + $(MAKE) -C $(BUILD_DIR) SUBDIRS=$$PWD SRCROOT=$$PWD/$(SRCROOT) \ + MODULEBUILDDIR=$(MODULEBUILDDIR) modules + $(MAKE) -C $$PWD SRCROOT=$$PWD/$(SRCROOT) \ + MODULEBUILDDIR=$(MODULEBUILDDIR) postbuild +endif + +vm_check_build = $(shell if $(CC) $(KBUILD_CPPFLAGS) $(KBUILD_CFLAGS) \ + $(CPPFLAGS) $(CFLAGS) $(CFLAGS_KERNEL) $(LINUXINCLUDE) \ + $(EXTRA_CFLAGS) -Iinclude2/asm/mach-default \ + -DKBUILD_BASENAME=\"$(DRIVER)\" \ + -Werror -S -o /dev/null -xc $(1) \ + > /dev/null 2>&1; then echo "$(2)"; else echo "$(3)"; fi) + +CC_WARNINGS := -Wall -Wstrict-prototypes +CC_OPTS := $(GLOBAL_DEFS) $(CC_WARNINGS) -DVMW_USING_KBUILD +ifdef VMX86_DEVEL +CC_OPTS += -DVMX86_DEVEL +endif +ifdef VMX86_DEBUG +CC_OPTS += -DVMX86_DEBUG +endif + +include $(SRCROOT)/Makefile.kernel + +else + +include $(SRCROOT)/Makefile.normal + +endif + +#.SILENT: diff --git a/vmmon-only/Makefile.kernel b/vmmon-only/Makefile.kernel new file mode 100644 index 00000000..bf805e02 --- /dev/null +++ b/vmmon-only/Makefile.kernel @@ -0,0 +1,39 @@ +#!/usr/bin/make -f +########################################################## +# Copyright (C) 1998,2015 VMware, Inc. All rights reserved. +# +# This program is free software; you can redistribute it and/or modify it +# under the terms of the GNU General Public License as published by the +# Free Software Foundation version 2 and no later version. 
+#
+# This program is distributed in the hope that it will be useful, but
+# WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
+# or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
+# for more details.
+#
+# You should have received a copy of the GNU General Public License along
+# with this program; if not, write to the Free Software Foundation, Inc.,
+# 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
+#
+##########################################################
+
+CC_OPTS += -DVMMON -DVMCORE
+
+INCLUDE := -I$(SRCROOT)/include -I$(SRCROOT)/common -I$(SRCROOT)/linux \
+           -I$(SRCROOT)/vmcore
+
+EXTRA_CFLAGS := $(CC_OPTS) $(INCLUDE)
+
+EXTRA_CFLAGS += $(call vm_check_build, $(SRCROOT)/autoconf/smpcall.c, -DVMW_HAVE_SMP_CALL_3ARG, )
+EXTRA_CFLAGS += $(call vm_check_build, $(SRCROOT)/autoconf/tsc_khz.c, -DVMW_HAVE_TSC_KHZ, )
+
+obj-m += $(DRIVER).o
+
+$(DRIVER)-y := $(subst $(SRCROOT)/, , $(patsubst %.c, %.o, \
+               $(wildcard $(SRCROOT)/linux/*.c $(SRCROOT)/common/*.c $(SRCROOT)/vmcore/*.c)))
+
+clean:
+	rm -rf $(wildcard $(DRIVER).mod.c $(DRIVER).ko .tmp_versions \
+	       Module.symvers Modules.symvers Module.markers modules.order \
+	       $(foreach dir,linux/ common/ vmcore/ \
+	       ./,$(addprefix $(dir),.*.cmd .*.o.flags *.o)))
diff --git a/vmmon-only/Makefile.normal b/vmmon-only/Makefile.normal
new file mode 100644
index 00000000..9e26a969
--- /dev/null
+++ b/vmmon-only/Makefile.normal
@@ -0,0 +1,143 @@
+#!/usr/bin/make -f
+##########################################################
+# Copyright (C) 1998,2015 VMware, Inc. All rights reserved.
+#
+# This program is free software; you can redistribute it and/or modify it
+# under the terms of the GNU General Public License as published by the
+# Free Software Foundation version 2 and no later version.
+#
+# This program is distributed in the hope that it will be useful, but
+# WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
+# or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
+# for more details.
+#
+# You should have received a copy of the GNU General Public License along
+# with this program; if not, write to the Free Software Foundation, Inc.,
+# 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
+#
+##########################################################
+
+vm_check_build = $(shell if $(CC) $(CC_OPTS) $(INCLUDE) -Werror -S -o /dev/null -xc $(1) \
+	> /dev/null 2>&1; then echo "$(2)"; else echo "$(3)"; fi)
+
+####
+#### DESTDIR is where the module, object files, and dependencies are built
+####
+DESTDIR := driver-$(VM_UNAME)
+
+####
+#### DRIVERNAME should be untouched unless you have a good reason to change
+#### it. The form below is how the scripts expect it.
+####
+DRIVERNAME := $(DRIVER)-xxx-$(VM_UNAME)
+
+ifneq (,$(filter x86_64%, $(shell $(CC) -dumpmachine)))
+MACHINE := x86_64
+else
+MACHINE := x386
+endif
+
+ifdef QUIET
+ECHO := @true
+else
+ECHO := @echo
+endif
+
+####
+#### You must compile with at least -O level of optimization
+#### or the module won't load.
+#### If desperate, I think that bringing in might
+#### suffice.
+####
+CC_WARNINGS := -Wall -Wstrict-prototypes
+# Don't use -pipe or egcs-2.91.66 (shipped with RedHat) will die
+CC_KFLAGS := -D__KERNEL__ -fno-strength-reduce -fno-omit-frame-pointer \
+             -fno-common -DKBUILD_MODNAME=$(DRIVER)
+CC_KFLAGS += $(call vm_check_gcc,-falign-loops=2 -falign-jumps=2 -falign-functions=2, \
+             -malign-loops=2 -malign-jumps=2 -malign-functions=2)
+CC_KFLAGS += $(call vm_check_gcc,-fno-strict-aliasing,)
+ifeq ($(MACHINE),x86_64)
+CC_KFLAGS += -mno-red-zone -mcmodel=kernel
+else
+# Gcc 3.0 deprecates -m486 --hpreg
+CC_KFLAGS += -DCPU=586 $(call check_gcc,-march=i586,-m486)
+endif
+
+CC_OPTS := -O2 -DMODULE -DVMMON -DVMCORE $(GLOBAL_DEFS) $(CC_KFLAGS) $(CC_WARNINGS)
+
+INCLUDE := -I$(SRCROOT)/include -I$(SRCROOT)/common -I$(SRCROOT)/linux \
+           -I$(SRCROOT)/vmcore -I$(HEADER_DIR)
+
+INCLUDE += $(shell $(CC) $(INCLUDE) -E $(SRCROOT)/autoconf/geninclude.c \
+           | sed -n -e 's!^APATH!-I$(HEADER_DIR)/asm!p')
+
+CC_OPTS += $(call vm_check_build, $(SRCROOT)/autoconf/smpcall.c, -DVMW_HAVE_SMP_CALL_3ARG, )
+CC_OPTS += $(call vm_check_build, $(SRCROOT)/autoconf/tsc_khz.c, -DVMW_HAVE_TSC_KHZ, )
+
+C_TARGETS_LINUX := driver.o hostif.o driverLog.o
+C_TARGETS_COMMON := vmx86.o memtrack.o phystrack.o cpuid.o task.o hashFunc.o
+C_TARGETS_VMCORE := moduleloop.o
+C_TARGETS_LINUX_D := ${C_TARGETS_LINUX:.o=.d}
+C_TARGETS_COMMON_D := ${C_TARGETS_COMMON:.o=.d}
+C_TARGETS_VMCORE_D := ${C_TARGETS_VMCORE:.o=.d}
+C_TARGETS := $(C_TARGETS_LINUX) $(C_TARGETS_COMMON) $(C_TARGETS_VMCORE)
+
+####
+#### Make Targets are beneath here.
+####
+
+driver: setup deps
+	$(MAKE) -C $(DESTDIR) -f ../Makefile SRCROOT=../$(SRCROOT) $(DRIVER).o \
+	  INCLUDE_DEPS=1
+
+setup:
+	@if [ -d $(DESTDIR) ] ; then true ; else mkdir $(DESTDIR); chmod 755 $(DESTDIR) ; fi
+
+$(DRIVER) $(DRIVER).o: $(DRIVERNAME)
+	cp -f $< $@
+
+$(DRIVERNAME): $(C_TARGETS)
+	$(ECHO) "Building $(DRIVERNAME)"
+	ld -r -o $(DRIVERNAME) $(C_TARGETS)
+
+auto-build:
+	$(MAKE) driver QUIET=1
+	cp -f $(DESTDIR)/$(DRIVERNAME) $(SRCROOT)/../$(DRIVER).o
+
+$(C_TARGETS_LINUX): %.o: $(SRCROOT)/linux/%.c
+	$(ECHO) "Compiling linux/$( $@
+
+$(C_TARGETS_LINUX_D): %.d: $(SRCROOT)/linux/%.c
+	$(ECHO) "Dependencies for $( $@
+
+$(C_TARGETS_VMCORE_D): %.d: $(SRCROOT)/vmcore/%.c
+	$(ECHO) "Dependencies for $( $@
+
+deps: setup
+	$(MAKE) -C $(DESTDIR) -f ../Makefile SRCROOT=../$(SRCROOT) driver_deps
+
+driver_deps: ${C_TARGETS:.o=.d}
+
+ifdef INCLUDE_DEPS
+include ${C_TARGETS:.o=.d}
+endif
+
+.SILENT:
diff --git a/vmmon-only/README b/vmmon-only/README
new file mode 100644
index 00000000..6a4da4c4
--- /dev/null
+++ b/vmmon-only/README
@@ -0,0 +1,14 @@
+The files in this directory and its subdirectories are the kernel module
+portion of the VMware Virtual Machine Monitor. In order to build, make
+certain the Makefile is correct, especially in whether or not your system
+is multi-processor, and then just type
+
+   make
+
+from this directory. A copy of the module will be left in
+
+   driver-/vmmon.o
+
+(e.g. driver-up-2.0.32/vmmon.o).
+
+If you have any problems or questions, send mail to support@vmware.com
diff --git a/vmmon-only/autoconf/geninclude.c b/vmmon-only/autoconf/geninclude.c
new file mode 100644
index 00000000..88d68dc5
--- /dev/null
+++ b/vmmon-only/autoconf/geninclude.c
@@ -0,0 +1,41 @@
+/*********************************************************
+ * Copyright (C) 2003 VMware, Inc. All rights reserved.
+ * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#include "compat_version.h" +#include "compat_autoconf.h" + +#ifdef CONFIG_X86_VOYAGER +APATH/mach-voyager +#endif +#ifdef CONFIG_X86_VISWS +APATH/mach-visws +#endif +#ifdef CONFIG_X86_NUMAQ +APATH/mach-numaq +#endif +#ifdef CONFIG_X86_BIGSMP +APATH/mach-bigsmp +#endif +#ifdef CONFIG_X86_SUMMIT +APATH/mach-summit +#endif +#ifdef CONFIG_X86_GENERICARCH +APATH/mach-generic +#endif +APATH/mach-default + diff --git a/vmmon-only/autoconf/smpcall.c b/vmmon-only/autoconf/smpcall.c new file mode 100644 index 00000000..e27a873a --- /dev/null +++ b/vmmon-only/autoconf/smpcall.c @@ -0,0 +1,37 @@ +/********************************************************* + * Copyright (C) 2008 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * Detect whether smp_call_function has 4 or 3 arguments. + * Change happened between 2.6.26 and 2.6.27-rc1. + */ + +#include "compat_version.h" +#include "compat_autoconf.h" + +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 26) +# error This compile test intentionally fails. +#elif LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 27) +# include + +int +vmware_smp_call_function(void (*func)(void *info), void *info, int wait) +{ + return smp_call_function(func, info, wait); +} +#endif diff --git a/vmmon-only/autoconf/tsc_khz.c b/vmmon-only/autoconf/tsc_khz.c new file mode 100644 index 00000000..f2f262f7 --- /dev/null +++ b/vmmon-only/autoconf/tsc_khz.c @@ -0,0 +1,32 @@ +/********************************************************* + * Copyright (C) 2015 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. 
+ *
+ * You should have received a copy of the GNU General Public License along
+ * with this program; if not, write to the Free Software Foundation, Inc.,
+ * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
+ *
+ *********************************************************/
+
+/*
+ * Detect if tsc_khz is available.
+ */
+
+#include "compat_version.h"
+#include "compat_autoconf.h"
+
+#include
+
+int
+vmw_tsc_khz(void)
+{
+   return tsc_khz;
+}
diff --git a/vmmon-only/common/apic.c b/vmmon-only/common/apic.c
new file mode 100644
index 00000000..a9eb1a4c
--- /dev/null
+++ b/vmmon-only/common/apic.c
@@ -0,0 +1,279 @@
+/*********************************************************
+ * Copyright (C) 2011 VMware, Inc. All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU General Public License as published by the
+ * Free Software Foundation version 2 and no later version.
+ *
+ * This program is distributed in the hope that it will be useful, but
+ * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
+ * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
+ * for more details.
+ *
+ * You should have received a copy of the GNU General Public License along
+ * with this program; if not, write to the Free Software Foundation, Inc.,
+ * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
+ *
+ *********************************************************/
+
+#include "vmware.h"
+#include "hostif.h"
+#include "x86cpuid_asm.h"
+#include "vm_asm.h"
+#include "cpuid.h"
+#include "apic.h"
+
+/*
+ *----------------------------------------------------------------------
+ *
+ * APIC_GetMA --
+ *
+ *      Return the MA of the host's APIC by reading the APIC_BASE
+ *      MSR and applying any necessary masking.
+ *
+ * Side effects:
+ *      None
+ *
+ * Return value:
+ *      MA of host APIC if successful (guaranteed to be page-aligned),
+ *      or the sentinel (MA)-1 if unsuccessful or if X2 APIC mode is enabled
+ *      since this disables the MMIO interface.
+ *
+ *----------------------------------------------------------------------
+ */
+
+MA
+APIC_GetMA(void)
+{
+   uint64 result;
+   CpuidVendor cpuVendor = CPUID_GetVendor();
+   uint32 features = CPUID_GetFeatures();
+
+   if (!CPUID_ISSET(1, EDX, MSR, features) ||
+       !CPUID_ISSET(1, EDX, APIC, features)) {
+      return (MA)-1;
+   }
+
+   if (cpuVendor != CPUID_VENDOR_INTEL &&
+       cpuVendor != CPUID_VENDOR_AMD &&
+       cpuVendor != CPUID_VENDOR_VIA) {
+      return (MA)-1;
+   }
+
+   /*
+    * Check if X2 APIC mode is enabled.
+    */
+
+   if ((__GET_MSR(MSR_APIC_BASE) & APIC_MSR_X2APIC_ENABLED) != 0) {
+      return (MA)-1;
+   }
+
+   /*
+    * APIC is present and enabled. The CPUID[0x1].edx[APIC] bit,
+    * already checked, mirrors the APIC base MSR's enable bit.
+    */
+
+   // Mask out goo in the low 12 bits, which is unrelated to the address.
+   result = __GET_MSR(MSR_APIC_BASE) & ~MASK64(PAGE_SHIFT);
+
+   /*
+    * On Intel, the high bits are reserved so we mask.
+    * On AMD, high bits are explicitly MBZ, so no need.
+    * Via doesn't specify, so we'll assume reserved.
+    */
+   if (cpuVendor == CPUID_VENDOR_INTEL || cpuVendor == CPUID_VENDOR_VIA) {
+      /*
+       * Intel suggests using CPUID 0x80000008.eax[7-0] (physical
+       * address size), with 36 (24 bit MPNs) as a fallback.
+       * Via has that cpuid leaf as well.
+ */ + unsigned numPhysicalBits = 36; + + if (CPUID_AddressSizeSupported()) { + numPhysicalBits = __GET_EAX_FROM_CPUID(0x80000008) & 0xff; + } + + result &= MASK64(numPhysicalBits); + } + + ASSERT_ON_COMPILE(sizeof(result) == sizeof(MA)); + return result; +} + + +/* + *---------------------------------------------------------------------- + * + * APIC_Read -- + * + * Reads the given APIC register using the proper interface. Does not + * check to see if the register number is valid. + * + * Side effects: + * Yes. + * + * Return value: + * Value of the register. + * + *---------------------------------------------------------------------- + */ + +uint32 +APIC_Read(const APICDescriptor *desc, // IN + int regNum) // IN +{ + if (desc->isX2) { + return (uint32 )__GET_MSR(MSR_X2APIC_BASE + regNum); + } else { + return desc->base[regNum][0]; + } +} + + +/* + *---------------------------------------------------------------------- + * + * APIC_ReadID -- + * + * Reads the APIC ID using the proper interface. The semantics of the + * ID are different in X2APIC mode so APIC_Read() should not be used. + * + * Side effects: + * None. + * + * Return value: + * APIC ID. + * + *---------------------------------------------------------------------- + */ + +uint32 +APIC_ReadID(const APICDescriptor *desc) // IN +{ + uint32 reg = APIC_Read(desc, APICR_ID); + + if (desc->isX2) { + return reg; + } else { + return (reg & XAPIC_ID_MASK) >> APIC_ID_SHIFT; + } +} + + +/* + *---------------------------------------------------------------------- + * + * APIC_Write -- + * + * Writes the given value to the given APIC register using the proper + * interface. Does not check to see if the register number is valid. + * + * Side effects: + * Yes. + * + * Return value: + * None. + * + *---------------------------------------------------------------------- + */ + +void +APIC_Write(const APICDescriptor *desc, // IN + int regNum, // IN + uint32 val) // IN +{ + if (desc->isX2) { + __SET_MSR(MSR_X2APIC_BASE + regNum, val); + } else { + desc->base[regNum][0] = val; + } +} + + +/* + *---------------------------------------------------------------------- + * + * APIC_ReadICR -- + * + * Reads the APIC ICR using the proper interface. The semantics of the + * ICR are different in X2APIC mode so APIC_Read() should not be used. + * + * Side effects: + * Yes. + * + * Return value: + * The full 64-bit value of the ICR. + * + *---------------------------------------------------------------------- + */ + +uint64 +APIC_ReadICR(const APICDescriptor *desc) // IN +{ + if (desc->isX2) { + return __GET_MSR(MSR_X2APIC_BASE + APICR_ICRLO); + } else { + uint32 icrHi = desc->base[APICR_ICRHI][0]; + uint32 icrLo = desc->base[APICR_ICRLO][0]; + return (uint64) icrHi << 32 | icrLo; + } +} + + +/* + *---------------------------------------------------------------------- + * + * APIC_WriteICR -- + * + * Writes the given value to the APIC ICR using the proper interface. + * The semantics of the ICR are different in X2APIC mode so APIC_Write() + * should not be used. + * + * Side effects: + * Yes. + * + * Return value: + * None. 
+ * + *---------------------------------------------------------------------- + */ + +void +APIC_WriteICR(const APICDescriptor *desc, // IN + uint32 id, // IN + uint32 icrLo) // IN +{ + if (desc->isX2) { + uint64 icr = (uint64) id << 32 | icrLo; + __SET_MSR(MSR_X2APIC_BASE + APICR_ICRLO, icr); + } else { + ASSERT(!(id & ~(APIC_ICRHI_DEST_MASK >> APIC_ICRHI_DEST_OFFSET))); + desc->base[APICR_ICRHI][0] = id << APIC_ICRHI_DEST_OFFSET; + desc->base[APICR_ICRLO][0] = icrLo; + } +} + + +/* + *---------------------------------------------------------------------- + * + * APIC_MaxLvt -- + * + * Reads the maximum number of LVT entries from the APIC version register. + * + * Side effects: + * No. + * + * Return value: + * The maximum number of LVT entries. + * + *---------------------------------------------------------------------- + */ + +uint32 +APIC_MaxLVT(const APICDescriptor *desc) // IN +{ + uint32 ver = APIC_Read(desc, APICR_VERSION); + + return (ver >> APIC_MAX_LVT_SHIFT) & APIC_MAX_LVT_MASK; +} diff --git a/vmmon-only/common/apic.h b/vmmon-only/common/apic.h new file mode 100644 index 00000000..4d5e751c --- /dev/null +++ b/vmmon-only/common/apic.h @@ -0,0 +1,47 @@ +/********************************************************* + * Copyright (C) 2011 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * apic.h -- + * + * Some host APIC helper functions + */ + +#ifndef APIC_H +#define APIC_H + +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMCORE +#include "includeCheck.h" + +#include "vm_basic_types.h" + +typedef struct { + Bool isX2; + volatile uint32 (*base)[4]; +} APICDescriptor; + +MA APIC_GetMA(void); +uint32 APIC_Read(const APICDescriptor *desc, int regNum); +void APIC_Write(const APICDescriptor *desc, int regNum, uint32 val); +void APIC_WriteICR(const APICDescriptor *desc, uint32 id, uint32 icrLo); +uint64 APIC_ReadICR(const APICDescriptor *desc); +uint32 APIC_ReadID(const APICDescriptor *desc); +uint32 APIC_MaxLVT(const APICDescriptor *desc); + +#endif diff --git a/vmmon-only/common/comport.c b/vmmon-only/common/comport.c new file mode 100644 index 00000000..4d591178 --- /dev/null +++ b/vmmon-only/common/comport.c @@ -0,0 +1,203 @@ +/********************************************************* + * Copyright (C) 2006,2016 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. 
+ * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * comport.c -- + * + * Simple COM1 port routines for debugging code that can't do any real + * host IO, such as the worldswitch and related. + * + * They all wait for the last character to complete transmission so if the + * system crashes immediately on return, the last character will be seen + * by the remote end. + * + * These routines do not have any external dependencies so can be called + * by any code that has privilege to access IO ports. + * + * Under Windows, they can be made to forward output to DbgPrint for + * printing via the debugger. Just have USE_DBGPRINT set to 1. If you + * let USE_DBGPRINT be 0 with Windows, make sure the comport hardware is + * powered-up by leaving Hyperterm running with the comport open, else + * Windows will power the chip down. + */ + +#include "comport.h" +#include "vm_basic_asm.h" // for INB, OUTB + +#if 000 // defined(_MSC_VER) +#define USE_DBGPRINT 1 +#define USE_MACPORT80 0 +#else +#define USE_DBGPRINT 0 +#ifdef __APPLE__ +#define USE_MACPORT80 1 +#else +#define USE_MACPORT80 0 +#endif +#endif + +#if USE_DBGPRINT +void DbgPrint(char const *format, ...); +#elif !USE_MACPORT80 +#define IOBASE 0x3F8 // COM1 base IO port number +#define BAUD 115200 // baud rate +#define THR 0 // transmitter holding register +#define LSR 5 // line status register +#define LSR_TE 0x20 // - transmit fifo completely empty +#define LSR_TI 0x40 // - transmitter idle +#endif + + +void +CP_Init(void) +{ +#if !USE_DBGPRINT && !USE_MACPORT80 + OUTB(IOBASE+3, 0x83); // LCR=select DLL/DLH, wordlen=8 bits + OUTB(IOBASE+0, (115200/BAUD)&255); // DLL=lo order baud rate + OUTB(IOBASE+1, (115200/BAUD)/256); // DLH=hi order baud rate + OUTB(IOBASE+3, 0x03); // LCR=select RBR/THR/IER + OUTB(IOBASE+4, 0x07); // MCR=dtr, rts, port-enable + OUTB(IOBASE+2, 0x07); // FCR=reset rcv fifo, reset xmt fifo + OUTB(IOBASE+1, 0); // IER=disable all interrupts +#endif +} + + +void +CP_PutChr(uint8 ch) // IN +{ +#if USE_DBGPRINT + DbgPrint("%c", ch); +#elif USE_MACPORT80 + int bit; + + OUTB(0x80, (ch & 1) | 0x10); + for (bit = 1; bit < 64; bit ++) { + OUTB(0x80, (ch >> (bit & 7)) & 1); + } +#else + if (ch == '\n') CP_PutChr('\r'); + while ((INB(IOBASE+LSR) & LSR_TE) == 0) { } + OUTB(IOBASE+THR, ch); + while ((INB(IOBASE+LSR) & LSR_TI) == 0) { } +#endif +} + + +void +CP_PutDec(uint32 value) // IN +{ +#if USE_DBGPRINT + DbgPrint("%u", value); +#else + char s[12]; + int i; + + i = 0; + do { + s[i++] = (value % 10) + '0'; + value /= 10; + } while (value > 0); + while (--i >= 0) CP_PutChr(s[i]); +#endif +} + + +void +CP_PutHexPtr(void *value) // IN +{ + if (sizeof value == 8) { + CP_PutHex64((uint64)(VA)value); + } + if (sizeof value == 4) { + CP_PutHex32((uint32)(VA)value); + } +} + + +void +CP_PutHex64(uint64 value) // IN +{ + CP_PutHex32((uint32)(value >> 32)); + CP_PutHex32((uint32)value); +} + + +void +CP_PutHex32(uint32 value) // IN +{ +#if USE_DBGPRINT + DbgPrint("%8.8X", value); +#else + CP_PutHex16((uint16)(value >> 16)); + CP_PutHex16((uint16)value); +#endif +} + + +void +CP_PutHex16(uint16 value) // IN +{ +#if USE_DBGPRINT + DbgPrint("%4.4X", value); +#else + CP_PutHex8((uint8)(value >> 8)); + CP_PutHex8((uint8)value); +#endif +} + + +void +CP_PutHex8(uint8 value) // IN +{ +#if USE_DBGPRINT + 
DbgPrint("%2.2X", value); +#else + CP_PutChr("0123456789ABCDEF"[(value>>4)&15]); + CP_PutChr("0123456789ABCDEF"[value&15]); +#endif +} + + +void +CP_PutSp(void) +{ + CP_PutChr(' '); +} + + +void +CP_PutCrLf(void) +{ + CP_PutChr('\n'); +} + + +void +CP_PutStr(char const *s) // IN +{ +#if USE_DBGPRINT + DbgPrint("%s", s); +#else + char c; + + while ((c = *(s ++)) != 0) { + CP_PutChr(c); + } +#endif +} diff --git a/vmmon-only/common/comport.h b/vmmon-only/common/comport.h new file mode 100644 index 00000000..bf3cdb09 --- /dev/null +++ b/vmmon-only/common/comport.h @@ -0,0 +1,41 @@ +/********************************************************* + * Copyright (C) 2006 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef _COMPORT_H +#define _COMPORT_H + +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMX +#include "includeCheck.h" + +#include "vm_basic_types.h" // for uint8, et al + +void CP_Init(void); +void CP_PutChr(uint8 ch); +void CP_PutDec(uint32 value); +void CP_PutHexPtr(void *value); +void CP_PutHex64(uint64 value); +void CP_PutHex32(uint32 value); +void CP_PutHex16(uint16 value); +void CP_PutHex8(uint8 value); +void CP_PutSp(void); +void CP_PutCrLf(void); +void CP_PutStr(char const *s); + +#endif diff --git a/vmmon-only/common/cpuid.c b/vmmon-only/common/cpuid.c new file mode 100644 index 00000000..4984eb00 --- /dev/null +++ b/vmmon-only/common/cpuid.c @@ -0,0 +1,209 @@ +/********************************************************* + * Copyright (C) 1998 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifdef linux +/* Must come before any kernel header file --hpreg */ +# include "driver-config.h" + +# include +#endif +#ifdef __APPLE__ +# include // For strcmp(). 
+#endif + +#include "vmware.h" +#include "vm_assert.h" +#include "hostif.h" +#include "cpuid.h" +#include "x86cpuid_asm.h" + +uint32 cpuidFeatures; +static CpuidVendor vendor = CPUID_NUM_VENDORS; +static uint32 version; + + +/* + *----------------------------------------------------------------------------- + * + * CPUIDExtendedSupported -- + * + * Determine whether processor supports extended CPUID (0x8000xxxx) + * and how many of them. + * + * Results: + * 0 if extended CPUID is not supported + * otherwise maximum extended CPUID supported (bit 31 set) + * + * Side effects: + * None. + * + *----------------------------------------------------------------------------- + */ + +static uint32 +CPUIDExtendedSupported(void) +{ + uint32 eax; + + eax = __GET_EAX_FROM_CPUID(0x80000000); + if ((eax & 0x80000000) != 0x80000000) { + return 0; + } + + return eax; +} + + +void +CPUID_Init(void) +{ + CPUIDRegs regs; + uint32 *ptr; + char name[16]; + + __GET_CPUID(1, ®s); + version = regs.eax; + cpuidFeatures = regs.edx; + + __GET_CPUID(0, ®s); + ptr = (uint32 *)name; + ptr[0] = regs.ebx; + ptr[1] = regs.edx; + ptr[2] = regs.ecx; + ptr[3] = 0; + + if (strcmp(name, CPUID_INTEL_VENDOR_STRING_FIXED) == 0) { + vendor = CPUID_VENDOR_INTEL; + } else if (strcmp(name, CPUID_AMD_VENDOR_STRING_FIXED) == 0) { + vendor = CPUID_VENDOR_AMD; + } else if (strcmp(name, CPUID_CYRIX_VENDOR_STRING_FIXED) == 0) { + vendor = CPUID_VENDOR_CYRIX; + } else { + Warning("VMMON CPUID: Unrecognized CPU\n"); + vendor = CPUID_VENDOR_UNKNOWN; + } +} + + +CpuidVendor +CPUID_GetVendor(void) +{ + ASSERT(vendor != CPUID_NUM_VENDORS); + return vendor; +} + + +uint32 +CPUID_GetVersion(void) +{ + ASSERT(vendor != CPUID_NUM_VENDORS); + return version; +} + + +/* + *----------------------------------------------------------------------------- + * + * CPUID_SyscallSupported -- + * + * Determine whether processor supports syscall opcode and MSRs. + * + * Results: + * FALSE if processor does not support syscall + * TRUE if processor supports syscall + * + * Side effects: + * It determines value only on first call, caching it for future. + * + *----------------------------------------------------------------------------- + */ + +Bool +CPUID_SyscallSupported(void) +{ + /* + * It is OK to use local static variables here as 'result' does not depend + * on any work done in CPUID_Init(). It purely depends on the CPU. + */ + static Bool initialized = FALSE; + static Bool result; + + if (UNLIKELY(!initialized)) { + result = CPUIDExtendedSupported() >= 0x80000001 + && (__GET_EDX_FROM_CPUID(0x80000001) & (1 << 11)); + initialized = TRUE; + } + + return result; +} + + +Bool +CPUID_LongModeSupported(void) +{ + /* + * It is OK to use local static variables here as 'result' does not depend + * on any work done in CPUID_Init(). It purely depends on the CPU. + */ + static Bool initialized = FALSE; + static Bool result; + + if (UNLIKELY(!initialized)) { + result = CPUIDExtendedSupported() >= 0x80000001 + && (__GET_EDX_FROM_CPUID(0x80000001) & (1 << 29)); + initialized = TRUE; + } + + return result; +} + + +/* + *----------------------------------------------------------------------------- + * + * CPUID_AddressSizeSupported -- + * + * Determine whether processor supports the address size cpuid + * extended leaf. + * + * Results: + * True iff the processor supports CPUID 0x80000008. + * + * Side effects: + * It determines value only on first call, caching it for future. 
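A minimal user-space sketch of the same probing order used by CPUID_Init() and CPUIDExtendedSupported() above: the vendor string is assembled from leaf 0's EBX, EDX, ECX (in that order), leaf 0x80000000 reports the highest extended leaf when bit 31 of EAX is set, and leaf 0x80000001 EDX carries the syscall (bit 11) and long-mode (bit 29) flags. This sketch assumes a GCC/Clang toolchain and its <cpuid.h> helper; the module itself uses its own __GET_CPUID/__GET_EAX_FROM_CPUID wrappers from x86cpuid_asm.h.

/* Build on x86 with GCC or Clang: cc -O2 cpuid_probe.c */
#include <cpuid.h>     /* __get_cpuid(): GCC/Clang wrapper around the CPUID instruction */
#include <stdint.h>
#include <stdio.h>
#include <string.h>

int main(void)
{
   unsigned eax, ebx, ecx, edx;
   char vendor[13];

   /* Leaf 0: vendor string is spread across EBX, EDX, ECX in that order. */
   if (!__get_cpuid(0, &eax, &ebx, &ecx, &edx)) {
      return 1;
   }
   memcpy(vendor + 0, &ebx, 4);
   memcpy(vendor + 4, &edx, 4);
   memcpy(vendor + 8, &ecx, 4);
   vendor[12] = '\0';

   /* Leaf 0x80000000: bit 31 set in EAX means extended leaves exist;
    * EAX is then the highest supported extended leaf. */
   if (!__get_cpuid(0x80000000u, &eax, &ebx, &ecx, &edx) ||
       (eax & 0x80000000u) == 0) {
      printf("%s: no extended CPUID leaves\n", vendor);
      return 0;
   }

   uint32_t maxExt = eax;
   int longMode = 0;

   /* Leaf 0x80000001: EDX bit 29 is long mode, bit 11 is syscall/sysret. */
   if (maxExt >= 0x80000001u &&
       __get_cpuid(0x80000001u, &eax, &ebx, &ecx, &edx)) {
      longMode = (edx >> 29) & 1;
   }
   printf("%s: max extended leaf %#x, long mode %s\n",
          vendor, maxExt, longMode ? "yes" : "no");
   return 0;
}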
+ * + *----------------------------------------------------------------------------- + */ + +Bool +CPUID_AddressSizeSupported(void) +{ + /* + * It is OK to use local static variables here as 'result' does not depend + * on any work done in CPUID_Init(). It purely depends on the CPU. + */ + static Bool initialized = FALSE; + static Bool result; + + if (UNLIKELY(!initialized)) { + result = CPUIDExtendedSupported() >= 0x80000008; + initialized = TRUE; + } + + return result; +} diff --git a/vmmon-only/common/cpuid.h b/vmmon-only/common/cpuid.h new file mode 100644 index 00000000..59bb8067 --- /dev/null +++ b/vmmon-only/common/cpuid.h @@ -0,0 +1,56 @@ +/********************************************************* + * Copyright (C) 1998,2016 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * cpuid.h -- + * + * wrap CPUID instruction + */ + +#ifndef CPUID_H +#define CPUID_H + +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMCORE +#include "includeCheck.h" + +#include "x86cpuid.h" + +extern uint32 cpuidFeatures; + +void CPUID_Init(void); +CpuidVendor CPUID_GetVendor(void); +uint32 CPUID_GetVersion(void); +Bool CPUID_SyscallSupported(void); +Bool CPUID_LongModeSupported(void); +Bool CPUID_AddressSizeSupported(void); + +static INLINE uint32 +CPUID_GetFeatures(void) +{ + return cpuidFeatures; +} + +static INLINE Bool +CPUID_SSE2Supported(void) +{ + return CPUID_ISSET(1, EDX, SSE2, CPUID_GetFeatures()); +} + +#endif + diff --git a/vmmon-only/common/hashFunc.c b/vmmon-only/common/hashFunc.c new file mode 100644 index 00000000..b8510821 --- /dev/null +++ b/vmmon-only/common/hashFunc.c @@ -0,0 +1,41 @@ +/********************************************************* + * Copyright (C) 2001 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + + +/* + * hashFunc.c -- + * + * The core implementation lives in lib/shared/hashFunc.h because it + * is shared by the vmkernel and vmmon. 
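The HashFunc_HashPage() wrapper defined just below hashes a 4 KiB page as 512 64-bit words with a fixed seed; hash2() itself lives in the shared header and is not part of this file. The standalone sketch below substitutes a simple FNV-1a-style word hash purely to illustrate the call shape and word-granular traversal; it is not the hash the module actually uses, and the seed handling is an illustrative assumption.

#include <stdint.h>
#include <stdio.h>
#include <string.h>

#define PAGE_SIZE_BYTES 4096u
#define WORDS_PER_PAGE  (PAGE_SIZE_BYTES / sizeof(uint64_t))   /* 512 words per page */

/* Stand-in for hash2(): a 64-bit FNV-1a-style hash over 64-bit words,
 * seeded the way HashFunc_HashPage() seeds hash2() with HASH_INIT_VALUE. */
static uint64_t DemoHashWords(const uint64_t *words, size_t count, uint64_t seed)
{
   uint64_t h = 14695981039346656037ull ^ seed;

   for (size_t i = 0; i < count; i++) {
      h ^= words[i];
      h *= 1099511628211ull;
   }
   return h;
}

static uint64_t DemoHashPage(const void *addr)
{
   return DemoHashWords(addr, WORDS_PER_PAGE, 42 /* HASH_INIT_VALUE */);
}

int main(void)
{
   static uint64_t page[WORDS_PER_PAGE];    /* one zeroed 4 KiB "page" */

   printf("hash of zero page: %#018llx\n",
          (unsigned long long)DemoHashPage(page));
   memset(page, 0xAB, sizeof page);
   printf("hash of 0xAB page: %#018llx\n",
          (unsigned long long)DemoHashPage(page));
   return 0;
}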
+ */ + +#include "hashFunc.h" + +/* + * Wrappers + */ + +// arbitrary constant +#define HASH_INIT_VALUE (42) + +// 64-bit hash for one 4K page +uint64 +HashFunc_HashPage(const void *addr) +{ + return hash2((uint64 *)addr, PAGE_SIZE / sizeof (uint64), HASH_INIT_VALUE); +} diff --git a/vmmon-only/common/hostKernel.h b/vmmon-only/common/hostKernel.h new file mode 100644 index 00000000..51dc0e3f --- /dev/null +++ b/vmmon-only/common/hostKernel.h @@ -0,0 +1,83 @@ +/********************************************************* + * Copyright (C) 1998 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * hostKernel.h -- + * + * Definition of HOST_KERNEL_* --hpreg + */ + + +#ifndef __HOST_KERNEL_H__ +# define __HOST_KERNEL_H__ + + +# ifdef linux +/* + * In some cases, this files needs to include Linux kernel header file + * asm/page.h. + * + * However, asm/page.h defines PAGE_SHIFT, PAGE_SIZE, PAGE_MASK, PAGE_OFFSET + * and VMware header file vm_basic_types.h defines PAGE_SHIFT, PAGE_SIZE, + * PAGE_MASK, PAGE_OFFSET. PAGE_MASK and PAGE_OFFSET are defined differently + * (XXX we should really prefix the VMware version with VM_ to prevent any + * further confusion), but fortunately the driver does not use them. + * + * So in this file, we must solve the definition conflict for files that + * include both this file and vm_basic_types.h. 2 cases can occur: + * + * 1) this file is included before vm_basic_types.h is included. This is fine, + * because vm_basic_types.h only defines PAGE_* if they don't exist yet. + * + * 2) vm_basic_types.h is included before this file is included. + * We must undefine + * PAGE_* in between. But this only works if asm/page.h is not included + * before this file is included. + * + * In summary: if you make sure you do not include asm/page.h before you + * include this file, then we guarantee that: + * . This file and vm_basic_types.h can be included in any order + * . asm/page.h will be included + * . The PAGE_* definitions will come from asm/page.h + * + * --hpreg + */ + +/* Must come before any kernel header file --hpreg */ +# include "driver-config.h" + +# undef PAGE_SHIFT +# undef PAGE_SIZE +# undef PAGE_MASK +# undef PAGE_OFFSET + +/* For __PAGE_OFFSET --hpreg */ +# include + +# define HOST_KERNEL_VA_2_LA(_x) (_x) +# define HOST_KERNEL_LA_2_VA(_x) (_x) +# else +/* For VA and LA --hpreg */ +# include "vm_basic_types.h" + +# define HOST_KERNEL_VA_2_LA(_addr) ((LA)(_addr)) +# define HOST_KERNEL_LA_2_VA(_addr) ((VA)(_addr)) +# endif + + +#endif /* __HOST_KERNEL_H__ */ diff --git a/vmmon-only/common/hostif.h b/vmmon-only/common/hostif.h new file mode 100644 index 00000000..865abc00 --- /dev/null +++ b/vmmon-only/common/hostif.h @@ -0,0 +1,148 @@ +/********************************************************* + * Copyright (C) 1998-2014 VMware, Inc. 
All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * hostif.h - Platform dependent interface for supporting + * the vmx86 device driver. + */ + + +#ifndef _HOSTIF_H_ +#define _HOSTIF_H_ + +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMCORE +#include "includeCheck.h" + +#include "vmx86.h" +#include "vcpuset.h" + +#include "hostifMem.h" +#include "hostifGlobalLock.h" + +/* + * Host-specific definitions. + */ +#if !__linux__ && !defined(WINNT_DDK) && !defined __APPLE__ +#error "Only Linux or NT or Mac OS defined for now." +#endif + + +/* + * The default monitor spin time for crosscalls is 50 usec + * in vmcore/vmx/main/monitor_init.c. This value is used + * in vmx86_YieldToSet to decide whether to block and wait + * for another vCPU to process our crosscall, or just wake + * up the other vCPUs and go back to monitor. + */ + +#define CROSSCALL_SPIN_SHORT_US 50 + +/* + * Sleep timeout in usec, see above comment for CROSSCALL_SPIN_SHORT_US + */ + +#define CROSSCALL_SLEEP_US 1000 + +/* Return value for HostIF_IPI. */ +typedef enum { + IPI_NONE, // No IPI was sent. + IPI_UNICAST, // Unicast IPIs were sent. + IPI_BROADCAST // A broadcast IPI was sent to all PCPUs. 
+} HostIFIPIMode; + +EXTERN int HostIF_Init(VMDriver *vm); +EXTERN int HostIF_LookupUserMPN(VMDriver *vm, VA64 uAddr, MPN *mpn); +EXTERN void *HostIF_MapCrossPage(VMDriver *vm, VA64 uAddr); +EXTERN void HostIF_InitFP(VMDriver *vm); + +EXTERN void *HostIF_AllocPage(void); +EXTERN void HostIF_FreePage(void *ptr); + +EXTERN int HostIF_LockPage(VMDriver *vm, VA64 uAddr, + Bool allowMultipleMPNsPerVA, MPN *mpn); +EXTERN int HostIF_UnlockPage(VMDriver *vm, VA64 uAddr); +EXTERN int HostIF_UnlockPageByMPN(VMDriver *vm, MPN mpn, VA64 uAddr); +EXTERN Bool HostIF_IsLockedByMPN(VMDriver *vm, MPN mpn); +EXTERN void HostIF_FreeAllResources(VMDriver *vm); +EXTERN uint64 HostIF_ReadUptime(void); +EXTERN uint64 HostIF_UptimeFrequency(void); +EXTERN unsigned int HostIF_EstimateLockedPageLimit(const VMDriver *vm, + unsigned int lockedPages); +EXTERN void HostIF_Wait(unsigned int timeoutMs); +EXTERN void HostIF_WaitForFreePages(unsigned int timeoutMs); +EXTERN void *HostIF_AllocCrossGDT(uint32 numPages, MPN maxValidFirst, + MPN *crossGDTMPNs); +EXTERN void HostIF_FreeCrossGDT(uint32 numPages, void *crossGDT); +EXTERN void HostIF_VMLock(VMDriver *vm, int callerID); +EXTERN void HostIF_VMUnlock(VMDriver *vm, int callerID); +#ifdef VMX86_DEBUG +EXTERN Bool HostIF_VMLockIsHeld(VMDriver *vm); +#endif + +EXTERN Bool HostIF_APICInit(VMDriver *vm, Bool setVMPtr, Bool probe); + +EXTERN int HostIF_SemaphoreWait(VMDriver *vm, + Vcpuid vcpuid, + uint64 *args); + +EXTERN int HostIF_SemaphoreSignal(uint64 *args); + +EXTERN void HostIF_SemaphoreForceWakeup(VMDriver *vm, const VCPUSet *vcs); +EXTERN HostIFIPIMode HostIF_IPI(VMDriver *vm, const VCPUSet *vcs); + +EXTERN uint32 HostIF_GetCurrentPCPU(void); +EXTERN void HostIF_CallOnEachCPU(void (*func)(void *), void *data); + +EXTERN Bool HostIF_PrepareWaitForThreads(VMDriver *vm, Vcpuid currVcpu); +EXTERN void HostIF_WaitForThreads(VMDriver *vm, Vcpuid currVcpu); +EXTERN void HostIF_CancelWaitForThreads(VMDriver *vm, Vcpuid currVcpu); +EXTERN void HostIF_WakeUpYielders(VMDriver *vm, Vcpuid currVcpu); + +EXTERN int HostIF_AllocLockedPages(VMDriver *vm, VA64 addr, + unsigned int numPages, Bool kernelMPNBuffer); +EXTERN int HostIF_FreeLockedPages(VMDriver *vm, VA64 addr, + unsigned int numPages, Bool kernelMPNBuffer); +EXTERN MPN HostIF_GetNextAnonPage(VMDriver *vm, MPN mpn); +EXTERN int HostIF_GetLockedPageList(VMDriver *vm, VA64 uAddr, + unsigned int numPages); + +EXTERN int HostIF_ReadPage(MPN mpn, VA64 addr, Bool kernelBuffer); +EXTERN int HostIF_WritePage(MPN mpn, VA64 addr, Bool kernelBuffer); +#ifdef _WIN32 +/* Add a HostIF_ReadMachinePage() if/when needed */ +EXTERN int HostIF_WriteMachinePage(MPN mpn, VA64 addr); +#else +#define HostIF_WriteMachinePage(_a, _b) HostIF_WritePage((_a), (_b), TRUE) +#endif +#if defined __APPLE__ +// There is no need for a fast clock lock on Mac OS. 
+#define HostIF_FastClockLock(_callerID) do {} while (0) +#define HostIF_FastClockUnlock(_callerID) do {} while (0) +#else +EXTERN void HostIF_FastClockLock(int callerID); +EXTERN void HostIF_FastClockUnlock(int callerID); +#endif +EXTERN int HostIF_SetFastClockRate(unsigned rate); + +EXTERN MPN HostIF_AllocMachinePage(void); +EXTERN void HostIF_FreeMachinePage(MPN mpn); + +EXTERN int HostIF_SafeRDMSR(uint32 msr, uint64 *val); + +#endif // ifdef _HOSTIF_H_ diff --git a/vmmon-only/common/hostifGlobalLock.h b/vmmon-only/common/hostifGlobalLock.h new file mode 100644 index 00000000..678e84ab --- /dev/null +++ b/vmmon-only/common/hostifGlobalLock.h @@ -0,0 +1,45 @@ +/********************************************************* + * Copyright (C) 1998 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * hostifGlobalLock.h - Platform dependent interface. This module + * defines functions for manipulating/checking + * the Global lock used by some drivers. + */ + + +#ifndef _HOSTIFGLOBALLOCK_H_ +#define _HOSTIFGLOBALLOCK_H_ + +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMCORE +#include "includeCheck.h" + + +#ifdef __APPLE__ +Bool HostIFGlobalLock_Start(void); +void HostIFGlobalLock_Stop(void); +#endif +void HostIF_GlobalLock(int callerID); +void HostIF_GlobalUnlock(int callerID); +#ifdef VMX86_DEBUG +Bool HostIF_GlobalLockIsHeld(void); +#endif + + +#endif // ifdef _HOSTIFGLOBALLOCK_H_ diff --git a/vmmon-only/common/hostifMem.h b/vmmon-only/common/hostifMem.h new file mode 100644 index 00000000..318534c2 --- /dev/null +++ b/vmmon-only/common/hostifMem.h @@ -0,0 +1,37 @@ +/********************************************************* + * Copyright (C) 1998 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * hostifMem.h - Platform dependent interface. This module defines + * functions for allocating and releasing memory + * from the kernel. 
+ */ + + +#ifndef _HOSTIFMEM_H_ +#define _HOSTIFMEM_H_ + +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMCORE +#include "includeCheck.h" + + +void *HostIF_AllocKernelMem(size_t size, int nonPageable); +void HostIF_FreeKernelMem(void *ptr); + +#endif // ifdef _HOSTIFMEM_H_ diff --git a/vmmon-only/common/memtrack.c b/vmmon-only/common/memtrack.c new file mode 100644 index 00000000..e53daebc --- /dev/null +++ b/vmmon-only/common/memtrack.c @@ -0,0 +1,551 @@ +/********************************************************* + * Copyright (C) 1998 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * memtrack.c -- + * + * Utility module for tracking pinned memory, which allows later + * lookup by VPN. + * + * -- + * + * Track memory using a 3-level directory, to keep allocations to one + * page in size. The first level is inlined with the MemTrack struct + * and a new page is allocated for each directory in the second level, + * as needed. The third level packs in as many MemTrackEntry structs + * on a single page as possible. + * + * Optionally use a 2-level directory on systems that prefer larger + * contiguous allocations. In this case we allow the first level + * allocation to be larger than 1 page (its size will depend on the + * maximum number of tracked pages, currently set to 4GB). + * + * MemTrack MemTrackDir1 MemTrackDir2 MemTrackDir3 + * (Handle) (Optional) + * + * ---->/----------\ + * | | Dir[0] |----->/----------\ + * | | Dir[1] | | Entry[0] | + * | | ... | | Entry[1] | + * | | Dir[N] | | ... | + * /----------\ MEMTRACK_DIR2_ENTRIES \----------/ | Entry[N] | + * | ... | | \----------/ + * | dir1 |----/----------\ | ->/----------\ + * | ... |\ | Dir[0] |---- | | Dir[N+1] | + * | | \ | Dir[1] |------- | Dir[N+2] | + * \----------/ \ | ... | | ... | + * \| Dir[N] |----- | Dir[N+N] | . + * \----------/ | \----------/ . + * MEMTRACK_DIR1_ENTRIES | . + * --->/----------\ + * | ... | + * | | + * | | + * | Dir[M] |----->/----------\ + * \----------/ | ... | + * | | + * | | + * | Entry[M] | + * \----------/ + * + * We also keep a simple chaining hash table of entries hashed on + * the VPN, for quick lookup. A separate hash table hashed on the MPN + * exists as well, but this is only used in debug builds. + * + * This tracker does not allow pages to be removed. If, in the future, + * we have a use case for removing MPNs from the tracker, a simple + * MemTrackEntry recycle scheme can be implemented at the cost of an + * additional pointer per MemTrackEntry instance. + */ + +#if defined(__linux__) +/* Must come before any kernel header file. */ +# include "driver-config.h" + +# include /* memset() in the kernel */ +#elif defined(WINNT_DDK) +# undef PAGE_SIZE /* Redefined in ntddk.h, and we use that defn. 
*/ +# undef PAGE_SHIFT +# include +#else +# include +#endif + +#include "vmware.h" +#include "hostif.h" + +#include "memtrack.h" + +/* + * Modify this value to increase the maximum number of tracked pages + * per MemTrack instance. + */ +#define MEMTRACK_MAX_TRACKED MBYTES_2_PAGES(4096) + +/* + * Linux uses a 3-level directory, because we want to keep allocations + * to a single page. + */ +#if defined(__linux__) +#define MEMTRACK_3LEVEL (1) +#endif + +#define MEMTRACK_DIR3_ENTRIES (PAGE_SIZE / sizeof (MemTrackEntry)) +#if defined(MEMTRACK_3LEVEL) +#define MEMTRACK_DIR2_ENTRIES (PAGE_SIZE / sizeof (void *)) +#else +#define MEMTRACK_DIR2_ENTRIES (1) +#endif +#define MEMTRACK_DIR1_ENTRIES CEILING(MEMTRACK_MAX_TRACKED, \ + (MEMTRACK_DIR2_ENTRIES * \ + MEMTRACK_DIR3_ENTRIES)) + +#define MEMTRACK_HT_SIZE (16384) +#define MEMTRACK_HT_ENTRIES (PAGE_SIZE / sizeof (void *)) +#define MEMTRACK_HT_PAGES (MEMTRACK_HT_SIZE / MEMTRACK_HT_ENTRIES) + +typedef struct MemTrackDir3 { + MemTrackEntry entries[MEMTRACK_DIR3_ENTRIES]; +} MemTrackDir3; + +#if defined(MEMTRACK_3LEVEL) +typedef struct MemTrackDir2 { + MemTrackDir3 *dir[MEMTRACK_DIR2_ENTRIES]; +} MemTrackDir2; +#else +typedef struct MemTrackDir3 MemTrackDir2; +#endif + +typedef struct MemTrackDir1 { + MemTrackDir2 *dir[MEMTRACK_DIR1_ENTRIES]; +} MemTrackDir1; + +typedef struct MemTrackHTPage { + MemTrackEntry *entries[MEMTRACK_HT_ENTRIES]; +} MemTrackHTPage; + +typedef struct MemTrackHT { + MemTrackHTPage *pages[MEMTRACK_HT_PAGES]; +} MemTrackHT; + +typedef uint64 MemTrackHTKey; + +typedef struct MemTrack { + unsigned numPages; /* Number of pages tracked. */ + MemTrackDir1 dir1; /* First level directory. */ + MemTrackHT vpnHashTable; /* VPN to entry hashtable. */ +#if defined(MEMTRACK_MPN_LOOKUP) + MemTrackHT mpnHashTable; /* MPN to entry hashtable. */ +#endif +} MemTrack; + +/* + * The following functions and macros help allocate and access the + * directory structure. This is convenient because the second level + * directory is optional. 
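A worked example of the directory sizing and of the index split performed by the MEMTRACK_IDX2DIR macro defined just below. It assumes 4 KiB pages, 64-bit pointers, and a 32-byte debug MemTrackEntry (vpn, mpn, two chain pointers); the real counts come from PAGE_SIZE and sizeof at compile time, so treat the numbers as illustrative.

#include <stdint.h>
#include <stdio.h>

#define DEMO_PAGE_SIZE  4096u
#define DEMO_ENTRY_SIZE 32u                                    /* assumed sizeof(MemTrackEntry) */
#define DIR3_ENTRIES    (DEMO_PAGE_SIZE / DEMO_ENTRY_SIZE)     /* 128 entries per leaf page     */
#define DIR2_ENTRIES    (DEMO_PAGE_SIZE / sizeof(void *))      /* 512 leaf pages per dir2 page  */
#define MAX_TRACKED     (4096u * 256u)                         /* pages in 4 GB of 4 KiB pages  */
#define CEILING(x, y)   (((x) + (y) - 1) / (y))

int main(void)
{
   unsigned long dir1Entries = CEILING(MAX_TRACKED, DIR2_ENTRIES * DIR3_ENTRIES);
   unsigned long idx = 1000000;   /* the 1,000,000th tracked page */
   unsigned long p1 = idx / (DIR2_ENTRIES * DIR3_ENTRIES);   /* first-level slot  */
   unsigned long p2 = (idx / DIR3_ENTRIES) % DIR2_ENTRIES;   /* second-level slot */
   unsigned long p3 = idx % DIR3_ENTRIES;                    /* entry within leaf */

   printf("capacity per dir2 page: %lu pages (%lu MB)\n",
          (unsigned long)(DIR2_ENTRIES * DIR3_ENTRIES),
          (unsigned long)(DIR2_ENTRIES * DIR3_ENTRIES) * 4 / 1024);
   printf("dir1 entries needed for 4 GB: %lu\n", dir1Entries);
   printf("idx %lu -> p1=%lu p2=%lu p3=%lu\n", idx, p1, p2, p3);
   return 0;
}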
+ */ + +#define MEMTRACK_IDX2DIR(_idx, _p1, _p2, _p3) \ + do { \ + _p1 = _idx / (MEMTRACK_DIR2_ENTRIES * MEMTRACK_DIR3_ENTRIES); \ + _p2 = (_idx / MEMTRACK_DIR3_ENTRIES) % MEMTRACK_DIR2_ENTRIES; \ + _p3 = _idx % MEMTRACK_DIR3_ENTRIES; \ + } while (0) + +#define MEMTRACK_GETDIR2(_dir1, _p1) (_dir1->dir[_p1]) +#define MEMTRACK_ALLOCDIR2(_dir1, _p1) MemTrackAllocDir2(_dir1, _p1) +#define MEMTRACK_FREEDIR2(_dir1) HostIF_FreePage(_dir1) + +#if defined(MEMTRACK_3LEVEL) +#define MEMTRACK_GETENTRY(_dir1, _p1, _p2, _p3) \ + (&((_dir1->dir[_p1])->dir[_p2])->entries[_p3]) +#define MEMTRACK_GETDIR3(_dir2, _p2) (_dir2->dir[_p2]) +#define MEMTRACK_ALLOCDIR3(_dir2, _p2) MemTrackAllocDir3(_dir2, _p2) +#define MEMTRACK_FREEDIR3(_dir2) HostIF_FreePage(_dir2) +#else +#define MEMTRACK_GETENTRY(_dir1, _p1, _p2, _p3) \ + (&(_dir1->dir[_p1])->entries[_p3]) +#define MEMTRACK_GETDIR3(_dir2, _p2) (_dir2) +#define MEMTRACK_ALLOCDIR3(_dir2, _p2) (_dir2) +#define MEMTRACK_FREEDIR3(_dir2) +#endif + +static INLINE void * +MemTrackAllocPage(void) +{ + void *ptr = HostIF_AllocPage(); + if (ptr != NULL) { + memset(ptr, 0, PAGE_SIZE); + } + return ptr; +} + +#define MEMTRACK_ALLOCDFN(_name, _itype, _otype) \ + static INLINE _otype * \ + _name(_itype *arg, unsigned pos) \ + { \ + if (arg->dir[pos] == NULL) { \ + arg->dir[pos] = MemTrackAllocPage(); \ + } \ + return arg->dir[pos]; \ + } + +#if defined(MEMTRACK_3LEVEL) +MEMTRACK_ALLOCDFN(MemTrackAllocDir3, MemTrackDir2, MemTrackDir3) +#endif +MEMTRACK_ALLOCDFN(MemTrackAllocDir2, MemTrackDir1, MemTrackDir2) + + +/* + *---------------------------------------------------------------------- + * + * MemTrackHTLookup -- + * MemTrackHTInsert -- + * + * Helper functions to insert or lookup entries in the VPN or + * MPN hash tables. Hash tables are always allocated in page + * size chunks. + * + *---------------------------------------------------------------------- + */ + +#define MEMTRACK_HASHKEY(_key, _hash, _page, _pos) \ + do { \ + _hash = _key % MEMTRACK_HT_SIZE; \ + _page = _hash / MEMTRACK_HT_ENTRIES; \ + _pos = _hash % MEMTRACK_HT_ENTRIES; \ + } while(0) + +static INLINE MemTrackEntry ** +MemTrackHTLookup(MemTrackHT *ht, // IN + MemTrackHTKey key) // IN +{ + uint64 hash, page, pos; + + MEMTRACK_HASHKEY(key, hash, page, pos); + + return &ht->pages[page]->entries[pos]; +} + +static INLINE void +MemTrackHTInsert(MemTrackHT *ht, // IN + MemTrackEntry *ent, // IN + MemTrackEntry **chain, // OUT + MemTrackHTKey key) // IN +{ + MemTrackEntry **head = MemTrackHTLookup(ht, key); + *chain = *head; + *head = ent; +} + + +/* + *---------------------------------------------------------------------- + * + * MemTrackCleanup -- + * + * Deallocate all memory associated with the specified tracker. + * + * Results: + * None. + * + * Side effects: + * Memory deallocation. 
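The hash tables above use intrusive head insertion: MemTrackHTInsert() stores the old bucket head into the new entry's chain pointer, so no separate node allocation is needed, and lookup simply walks the chain comparing keys. A minimal standalone sketch of the same idiom, with a much smaller table than the real 16384-bucket, page-backed one; DemoEntry and the 8-bucket size are illustrative names only.

#include <stdint.h>
#include <stdio.h>

#define DEMO_HT_SIZE 8u            /* the real table uses 16384 buckets split across pages */

typedef struct DemoEntry {
   uint64_t vpn;
   uint64_t mpn;
   struct DemoEntry *vpnChain;     /* intrusive chain pointer, like MemTrackEntry */
} DemoEntry;

static DemoEntry *buckets[DEMO_HT_SIZE];

/* Head insertion: the new entry remembers the old head in its chain pointer. */
static void DemoInsert(DemoEntry *ent)
{
   DemoEntry **head = &buckets[ent->vpn % DEMO_HT_SIZE];

   ent->vpnChain = *head;
   *head = ent;
}

/* Walk the bucket's chain until the VPN matches, as MemTrack_LookupVPN() does. */
static DemoEntry *DemoLookup(uint64_t vpn)
{
   for (DemoEntry *e = buckets[vpn % DEMO_HT_SIZE]; e != NULL; e = e->vpnChain) {
      if (e->vpn == vpn) {
         return e;
      }
   }
   return NULL;
}

int main(void)
{
   static DemoEntry pool[3];
   uint64_t vpns[3] = { 5, 13, 21 };          /* 13 and 21 collide with 5 (mod 8) */

   for (int i = 0; i < 3; i++) {
      pool[i].vpn = vpns[i];
      pool[i].mpn = 100 + i;
      DemoInsert(&pool[i]);
   }
   for (int i = 0; i < 3; i++) {
      DemoEntry *e = DemoLookup(vpns[i]);
      printf("vpn %llu -> mpn %llu\n",
             (unsigned long long)vpns[i], (unsigned long long)(e ? e->mpn : 0));
   }
   return 0;
}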
+ * + *---------------------------------------------------------------------- + */ + +static void +MemTrackCleanup(MemTrack *mt) // IN +{ + unsigned idx; + unsigned p1; + MemTrackDir1 *dir1; + + if (mt == NULL) { + return; + } + dir1 = &mt->dir1; + + for (p1 = 0; p1 < MEMTRACK_DIR1_ENTRIES; p1++) { + unsigned p2; + MemTrackDir2 *dir2 = MEMTRACK_GETDIR2(dir1, p1); + + if (dir2 == NULL) { + break; + } + for (p2 = 0; p2 < MEMTRACK_DIR2_ENTRIES; p2++) { + MemTrackDir3 *dir3 = MEMTRACK_GETDIR3(dir2, p2); + + if (dir3 == NULL) { + break; + } + MEMTRACK_FREEDIR3(dir3); + } + MEMTRACK_FREEDIR2(dir2); + } + + for (idx = 0; idx < MEMTRACK_HT_PAGES; idx++) { + if (mt->vpnHashTable.pages[idx] != NULL) { + HostIF_FreePage(mt->vpnHashTable.pages[idx]); + } +#if defined(MEMTRACK_MPN_LOOKUP) + if (mt->mpnHashTable.pages[idx] != NULL) { + HostIF_FreePage(mt->mpnHashTable.pages[idx]); + } +#endif + } + + HostIF_FreeKernelMem(mt); +} + + +/* + *---------------------------------------------------------------------- + * + * MemTrack_Init -- + * + * Allocate and initialize the tracker. + * + * Results: + * Handle used to access the tracker. + * + * Side effects: + * Memory allocation. + * + *---------------------------------------------------------------------- + */ + +MemTrack * +MemTrack_Init(void) +{ + MemTrack *mt; + unsigned idx; + +#if defined(MEMTRACK_3LEVEL) + ASSERT_ON_COMPILE(sizeof *mt <= PAGE_SIZE); + ASSERT_ON_COMPILE(sizeof (MemTrackDir2) == PAGE_SIZE); +#endif + ASSERT_ON_COMPILE(sizeof (MemTrackDir3) <= PAGE_SIZE); + + mt = HostIF_AllocKernelMem(sizeof *mt, FALSE); + if (mt == NULL) { + Warning("MemTrack failed to allocate handle.\n"); + goto error; + } + memset(mt, 0, sizeof *mt); + + for (idx = 0; idx < MEMTRACK_HT_PAGES; idx++) { + MemTrackHTPage *htPage = MemTrackAllocPage(); + + if (htPage == NULL) { + Warning("MemTrack failed to allocate VPN hash table (%d).\n", idx); + goto error; + } + mt->vpnHashTable.pages[idx] = htPage; + } + +#if defined(MEMTRACK_MPN_LOOKUP) + for (idx = 0; idx < MEMTRACK_HT_PAGES; idx++) { + MemTrackHTPage *htPage = MemTrackAllocPage(); + + if (htPage == NULL) { + Warning("MemTrack failed to allocate MPN hash table (%d).\n", idx); + goto error; + } + mt->mpnHashTable.pages[idx] = htPage; + } +#endif + + return mt; + +error: + MemTrackCleanup(mt); + return NULL; +} + + +/* + *---------------------------------------------------------------------- + * + * MemTrack_Add -- + * + * Add the specified VPN:MPN pair to the memory tracker. + * + * Results: + * A pointer to the element, or NULL on error. + * + * Side effects: + * Memory allocation. 
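A hedged usage sketch of the tracker's life cycle, using only the functions declared in memtrack.h and hostif.h. It would be compiled inside vmmon (it relies on VMDriver, VA64, and PAGE_SHIFT from the module's headers) and is not a standalone program; DemoUnpin, DemoLifeCycle, and the way the user address is reconstructed from the VPN are hypothetical illustrations, not code from this patch.

#include "vmware.h"
#include "hostif.h"
#include "memtrack.h"

/* Cleanup callback: invoked once per tracked page during teardown,
 * e.g. to unpin the MPN with the host OS. */
static void
DemoUnpin(void *cData,            // IN: VMDriver passed through MemTrack_Cleanup()
          MemTrackEntry *entry)   // IN: one tracked VPN:MPN pair
{
   VMDriver *vm = cData;

   (void)HostIF_UnlockPageByMPN(vm, entry->mpn, (VA64)entry->vpn << PAGE_SHIFT);
}

/* Sketch of the add/lookup/cleanup life cycle. */
static void
DemoLifeCycle(VMDriver *vm, VPN64 vpn, MPN mpn)
{
   struct MemTrack *mt = MemTrack_Init();

   if (mt == NULL) {
      return;
   }
   if (MemTrack_LookupVPN(mt, vpn) == NULL) {
      (void)MemTrack_Add(mt, vpn, mpn);            /* NULL means the tracker is full */
   }
   (void)MemTrack_Cleanup(mt, DemoUnpin, vm);      /* returns the number of pages seen */
}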
+ * + *---------------------------------------------------------------------- + */ + +MemTrackEntry * +MemTrack_Add(MemTrack *mt, // IN + VPN64 vpn, // IN + MPN mpn) // IN +{ + unsigned idx = mt->numPages; + unsigned p1, p2, p3; + MemTrackEntry *ent; + MemTrackDir1 *dir1 = &mt->dir1; + MemTrackDir2 *dir2; + MemTrackDir3 *dir3; + MEMTRACK_IDX2DIR(idx, p1, p2, p3); + + if (p1 >= MEMTRACK_DIR1_ENTRIES || + p2 >= MEMTRACK_DIR2_ENTRIES || + p3 >= MEMTRACK_DIR3_ENTRIES) { + return NULL; + } + + dir2 = MEMTRACK_ALLOCDIR2(dir1, p1); + if (dir2 == NULL) { + return NULL; + } + + dir3 = MEMTRACK_ALLOCDIR3(dir2, p2); + if (dir3 == NULL) { + return NULL; + } + + ent = MEMTRACK_GETENTRY(dir1, p1, p2, p3); + ent->vpn = vpn; + ent->mpn = mpn; + + MemTrackHTInsert(&mt->vpnHashTable, ent, &ent->vpnChain, ent->vpn); +#if defined(MEMTRACK_MPN_LOOKUP) + MemTrackHTInsert(&mt->mpnHashTable, ent, &ent->mpnChain, ent->mpn); +#endif + + mt->numPages++; + + return ent; +} + + +/* + *---------------------------------------------------------------------- + * + * MemTrack_LookupVPN -- + * + * Lookup the specified VPN address in the memory tracker. + * + * Results: + * A pointer to the element, or NULL if not there. + * + * Side effects: + * None. + * + *---------------------------------------------------------------------- + */ + +MemTrackEntry * +MemTrack_LookupVPN(MemTrack *mt, // IN + VPN64 vpn) // IN +{ + MemTrackEntry *next = *MemTrackHTLookup(&mt->vpnHashTable, vpn); + + while (next != NULL) { + if (next->vpn == vpn) { + return next; + } + next = next->vpnChain; + } + + return NULL; +} + + +#if defined(MEMTRACK_MPN_LOOKUP) +/* + *---------------------------------------------------------------------- + * + * MemTrack_LookupMPN -- + * + * Lookup the specified MPN address in the memory tracker. + * + * Results: + * A pointer to the element, or NULL if not there. + * + * Side effects: + * None. + * + *---------------------------------------------------------------------- + */ +MemTrackEntry * +MemTrack_LookupMPN(MemTrack *mt, // IN + MPN mpn) // IN +{ + MemTrackEntry *next = *MemTrackHTLookup(&mt->mpnHashTable, mpn); + + while (next != NULL) { + if (next->mpn == mpn) { + return next; + } + next = next->mpnChain; + } + + return NULL; +} +#endif + + +/* + *---------------------------------------------------------------------- + * + * MemTrack_Cleanup -- + * + * Cleanup all resources allocated for the tracker. For + * all pages in the tracker call the user provided clean up + * function. + * + * Results: + * Number of pages in the tracker. + * + * Side effects: + * Memory deallocation. + * + *---------------------------------------------------------------------- + */ + +unsigned +MemTrack_Cleanup(MemTrack *mt, // IN + MemTrackCleanupCb *cb, // IN + void *cData) // IN +{ + unsigned idx; + unsigned count = 0; + + for (idx = 0; idx < mt->numPages; idx++) { + unsigned p1, p2, p3; + MemTrackEntry *ent; + MemTrackDir1 *dir1 = &mt->dir1; + MEMTRACK_IDX2DIR(idx, p1, p2, p3); + + ent = MEMTRACK_GETENTRY(dir1, p1, p2, p3); + cb(cData, ent); + + count++; + } + + MemTrackCleanup(mt); + + return count; +} diff --git a/vmmon-only/common/memtrack.h b/vmmon-only/common/memtrack.h new file mode 100644 index 00000000..977c5af3 --- /dev/null +++ b/vmmon-only/common/memtrack.h @@ -0,0 +1,60 @@ +/********************************************************* + * Copyright (C) 1998 VMware, Inc. All rights reserved. 
+ * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * memtrack.h -- + * + * Utility module for tracking pinned memory, which allows later + * lookup by VPN. + */ + + +#ifndef _MEMTRACK_H_ +#define _MEMTRACK_H_ + +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMCORE +#include "includeCheck.h" + +#if defined(VMX86_DEBUG) +#define MEMTRACK_MPN_LOOKUP +#endif + +struct MemTrack; + +typedef struct MemTrackEntry { + VPN64 vpn; + MPN mpn; + struct MemTrackEntry *vpnChain; +#if defined(MEMTRACK_MPN_LOOKUP) + struct MemTrackEntry *mpnChain; +#endif +} MemTrackEntry; + +typedef void (MemTrackCleanupCb)(void *cData, MemTrackEntry *entry); + +extern struct MemTrack *MemTrack_Init(void); +extern unsigned MemTrack_Cleanup(struct MemTrack *mt, MemTrackCleanupCb *cb, + void *cbData); +extern MemTrackEntry *MemTrack_Add(struct MemTrack *mt, VPN64 vpn, MPN mpn); +extern MemTrackEntry *MemTrack_LookupVPN(struct MemTrack *mt, VPN64 vpn); +#if defined(MEMTRACK_MPN_LOOKUP) +extern MemTrackEntry *MemTrack_LookupMPN(struct MemTrack *mt, MPN mpn); +#endif + +#endif // _MEMTRACK_H_ diff --git a/vmmon-only/common/phystrack.c b/vmmon-only/common/phystrack.c new file mode 100644 index 00000000..5972e24a --- /dev/null +++ b/vmmon-only/common/phystrack.c @@ -0,0 +1,495 @@ +/********************************************************* + * Copyright (C) 1998,2014 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * phystrack.c -- + * + * track down the utilization of the physical pages. + * + * Depending on configuration phystracker provides either 2-level or + * 3-level structure to track whether page (specified by its MPN) is + * locked or no. Linux uses 3-level structures with top limit of + * 1TB (32bit) or 16TB (64bit). Windows use 2-level structures + * ready to hold 128GB (32bit) or 2TB (64bit) of memory. On Mac + * limit is 2-level 128GB. + * + * 2-level phystracker is built on top of 3-level one by collapsing + * middle level. 
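The coverage figures quoted in the comment above follow directly from the PHYSTRACK_L*_ENTRIES definitions below. A short worked-arithmetic sketch, assuming 4 KiB pages and 64-bit pointers (the Linux 3-level layout): one L3 bitmap page holds 8 * 4096 bits, one L2 page holds PAGE_SIZE / sizeof(void *) L3 pointers, and the first level is fixed at 256 entries.

#include <stdio.h>

int main(void)
{
   /* Assumes 4 KiB pages and 64-bit pointers (the Linux 3-level layout). */
   unsigned long long pageSize  = 4096;
   unsigned long long l3Pages   = 8 * pageSize;              /* bits per L3 page = 32768 MPNs */
   unsigned long long l2Entries = pageSize / sizeof(void *); /* 512 L3 pages per L2 page      */
   unsigned long long l1Entries = 256;                       /* fixed first-level size        */

   unsigned long long perL3 = l3Pages * pageSize;            /* bytes covered by one L3 page */
   unsigned long long perL2 = perL3 * l2Entries;             /* bytes covered by one L2 page */
   unsigned long long total = perL2 * l1Entries;             /* whole tracker                */

   printf("one L3 page covers %llu MB\n", perL3 >> 20);      /* 128 MB */
   printf("one L2 page covers %llu GB\n", perL2 >> 30);      /* 64 GB  */
   printf("full tracker covers %llu TB\n", total >> 40);     /* 16 TB  */
   return 0;
}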
+ */ + + +#ifdef linux +/* Must come before any kernel header file --hpreg */ +# include "driver-config.h" + +# include /* memset() in the kernel */ +#else +# include +#endif + +#include "vmware.h" +#include "vmx86.h" +#include "phystrack.h" +#include "hostif.h" + +#define BYTES_PER_ENTRY (PAGE_SIZE) +#define PHYSTRACK_L3_ENTRIES (8 * BYTES_PER_ENTRY) /* 128MB */ + +#if defined(WINNT_DDK) +#define PHYSTRACK_L1_ENTRIES (PHYSTRACK_MAX_SUPPORTED_GB * 8) +#elif defined(__linux__) +#define PHYSTRACK_L2_ENTRIES (BYTES_PER_ENTRY / sizeof(void *)) /* 64GB or 128GB */ +/* + * Currently MPN is 32 bits. 15 bits are in L3, 9 bits are in L2, + * leaving 8 bits for L1... + */ +#define PHYSTRACK_L1_ENTRIES (256) /* 16TB. */ +#else +#define PHYSTRACK_L1_ENTRIES ((128 + 4) * 8) /* 128 GB */ +#endif + +#ifndef PHYSTRACK_L2_ENTRIES +#define PHYSTRACK_L2_ENTRIES (1) +#else +#define PHYSTRACK_3LEVEL (1) +#endif + +typedef struct PhysTrackerL3 { + uint8 bits[BYTES_PER_ENTRY]; +} PhysTrackerL3; + +#ifdef PHYSTRACK_3LEVEL +typedef struct PhysTrackerL2 { + PhysTrackerL3 *dir[PHYSTRACK_L2_ENTRIES]; +} PhysTrackerL2; +#else +typedef struct PhysTrackerL3 PhysTrackerL2; +#endif + +typedef struct PhysTracker { + VMDriver *vm; /* Used only for debugging and asserts. */ + PhysTrackerL2 *dir[PHYSTRACK_L1_ENTRIES]; +} PhysTracker; + + +/* + * Convert MPN to p1, p2, and p3 indices. p1/p2/p3 must be l-values. + * Currently we support a 64 bit container for an MPN + * in hosted but not an actual 64 bit value as no hosted OS + * supports this yet. Hence in PhysMem tracker we are deliberately using + * a 32-bit container to save memory. Also the tracker is allocating pages + * considering the MPN to be a 32 bit value. This will change once we get + * systems supporting 64 bit memory/addressing space. + * Until then let us assert if a value greater than 32 bit is being passed. + */ +#define PHYSTRACK_MPN2IDX(mpn, p1, p2, p3) \ + do { \ + ASSERT((mpn >> 32) == 0); \ + p2 = (unsigned)(mpn) / PHYSTRACK_L3_ENTRIES; \ + p1 = p2 / PHYSTRACK_L2_ENTRIES; \ + p2 = p2 % PHYSTRACK_L2_ENTRIES; \ + p3 = (unsigned)(mpn) % PHYSTRACK_L3_ENTRIES; \ + } while (0) + +/* + * Convert L3 index to offset and bitmask. offs/bitmask must be l-values. + */ +#define PHYSTRACK_GETL3POS(p3, offs, bitmask) \ + do { \ + offs = (p3) / 8; \ + bitmask = 1 << ((p3) % 8); \ + } while (0) + +/* + * Helpers hiding middle level. + */ +#ifdef PHYSTRACK_3LEVEL +#define PHYSTRACK_GETL3(dir2, p2) (dir2)->dir[(p2)] +#define PHYSTRACK_ALLOCL3(dir2, p2) PhysTrackAllocL3((dir2), (p2)) +#define PHYSTRACK_FREEL3(dir2, p2) PhysTrackFreeL3((dir2), (p2)) +#else +#define PHYSTRACK_GETL3(dir2, p2) (dir2) +#define PHYSTRACK_ALLOCL3(dir2, p2) (dir2) +#define PHYSTRACK_FREEL3(dir2, p2) do { } while (0) +#endif + + +#ifdef PHYSTRACK_3LEVEL +/* + *---------------------------------------------------------------------- + * + * PhysTrackAllocL3 -- + * + * Allocate and hook L3 table to the L2 directory if does not exist. + * Or get existing one if it exists. + * + * Results: + * L3 table. + * + * Side effects: + * None. 
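A standalone sketch of the index math performed by PHYSTRACK_MPN2IDX and PHYSTRACK_GETL3POS above: the MPN first selects an L3 bitmap page (p1, p2), then a bit inside it (p3), which in turn reduces to a byte offset and a bitmask. The constants mirror the 4 KiB page / 64-bit pointer case, and the example MPN is arbitrary.

#include <stdio.h>

#define BYTES_PER_ENTRY 4096u
#define L3_ENTRIES      (8u * BYTES_PER_ENTRY)              /* MPNs per L3 page */
#define L2_ENTRIES      (BYTES_PER_ENTRY / sizeof(void *))  /* 512 on 64-bit    */

int main(void)
{
   unsigned long long mpn = 0x123456;         /* example MPN: a page at roughly 4.5 GB */
   unsigned p2 = (unsigned)(mpn / L3_ENTRIES);
   unsigned p1 = p2 / L2_ENTRIES;
   unsigned p3 = (unsigned)(mpn % L3_ENTRIES);
   unsigned offs, bitmask;

   p2 %= L2_ENTRIES;
   offs    = p3 / 8;                          /* byte within the L3 bitmap page */
   bitmask = 1u << (p3 % 8);                  /* bit within that byte           */

   printf("mpn %#llx -> p1=%u p2=%u p3=%u (byte %u, mask %#x)\n",
          mpn, p1, p2, p3, offs, bitmask);
   return 0;
}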
+ * + *---------------------------------------------------------------------- + */ + +static INLINE_SINGLE_CALLER PhysTrackerL3 * +PhysTrackAllocL3(PhysTrackerL2 *dir2, + unsigned int p2) +{ + PhysTrackerL3 *dir3; + + dir3 = dir2->dir[p2]; + if (!dir3) { + ASSERT_ON_COMPILE(sizeof *dir3 == PAGE_SIZE); + dir3 = HostIF_AllocPage(); + if (!dir3) { + PANIC(); + } + memset(dir3, 0, sizeof *dir3); + dir2->dir[p2] = dir3; + } + return dir3; +} + + +/* + *---------------------------------------------------------------------- + * + * PhysTrackFreeL3 -- + * + * Unhook L3 table from L2 directory, and free it. + * + * Results: + * None. + * + * Side effects: + * None. + * + *---------------------------------------------------------------------- + */ + +static INLINE_SINGLE_CALLER void +PhysTrackFreeL3(PhysTrackerL2 *dir2, + unsigned int p2) +{ + HostIF_FreePage(dir2->dir[p2]); + dir2->dir[p2] = NULL; +} +#endif + + +/* + *---------------------------------------------------------------------- + * + * PhysTrack_Alloc -- + * + * Create new PhysTracker. + * + * Results: + * Creates new PhysTracker. + * + * Side effects: + * None. + * + *---------------------------------------------------------------------- + */ + +PhysTracker * +PhysTrack_Alloc(VMDriver *vm) +{ + PhysTracker *tracker; + + ASSERT(vm != NULL); + + /* allocate a new phystracker */ + tracker = HostIF_AllocKernelMem(sizeof *tracker, FALSE); + if (tracker) { + memset(tracker, 0, sizeof *tracker); + tracker->vm = vm; + } else { + Warning("%s failed\n", __FUNCTION__); + } + + return tracker; +} + + +/* + *---------------------------------------------------------------------- + * + * PhysTrack_Free -- + * + * module deallocation + * + * Results: + * reallocates all structures, including 'tracker' + * + * Side effects: + * tracker deallocated + * + *---------------------------------------------------------------------- + */ + +void +PhysTrack_Free(PhysTracker *tracker) +{ + unsigned int p1; + + ASSERT(tracker); + + for (p1 = 0; p1 < PHYSTRACK_L1_ENTRIES; p1++) { + PhysTrackerL2 *dir2 = tracker->dir[p1]; + + if (dir2) { + unsigned int p2; + + for (p2 = 0; p2 < PHYSTRACK_L2_ENTRIES; p2++) { + PhysTrackerL3 *dir3 = PHYSTRACK_GETL3(dir2, p2); + + if (dir3) { + unsigned int pos; + + for (pos = 0; pos < BYTES_PER_ENTRY; pos++) { + if (dir3->bits[pos]) { + Warning("%s: pfns still locked\n", __FUNCTION__); + PANIC(); + } + } + PHYSTRACK_FREEL3(dir2, p2); + } + } + HostIF_FreePage(dir2); + tracker->dir[p1] = NULL; + } + } + HostIF_FreeKernelMem(tracker); +} + + +/* + *---------------------------------------------------------------------- + * + * PhysTrack_Add -- + * + * add a page to the core map tracking. + * + * Results: + * void + * + * Side effects: + * Fatal if the page is already tracked. 
+ * + *---------------------------------------------------------------------- + */ + +void +PhysTrack_Add(PhysTracker *tracker, // IN/OUT + MPN mpn) // IN: MPN of page to be added +{ + unsigned int p1; + unsigned int p2; + unsigned int p3; + unsigned int pos; + unsigned int bit; + PhysTrackerL2 *dir2; + PhysTrackerL3 *dir3; + + ASSERT(tracker); + ASSERT(HostIF_VMLockIsHeld(tracker->vm)); + PHYSTRACK_MPN2IDX(mpn, p1, p2, p3); + ASSERT(p1 < PHYSTRACK_L1_ENTRIES); + + dir2 = tracker->dir[p1]; + if (!dir2) { + // more efficient with page alloc + ASSERT_ON_COMPILE(sizeof *dir2 == PAGE_SIZE); + dir2 = HostIF_AllocPage(); + if (!dir2) { + PANIC(); + } + memset(dir2, 0, sizeof *dir2); + tracker->dir[p1] = dir2; + } + dir3 = PHYSTRACK_ALLOCL3(dir2, p2); + PHYSTRACK_GETL3POS(p3, pos, bit); + if (dir3->bits[pos] & bit) { + PANIC(); + } + dir3->bits[pos] |= bit; +} + + +/* + *---------------------------------------------------------------------- + * + * PhysTrack_Remove -- + * + * remove a page from the core map tracking + * + * Results: + * void + * + * Side effects: + * Fatal if the page is not tracked + * + *---------------------------------------------------------------------- + */ + +void +PhysTrack_Remove(PhysTracker *tracker, // IN/OUT + MPN mpn) // IN: MPN of page to be removed. +{ + unsigned int p1; + unsigned int p2; + unsigned int p3; + unsigned int pos; + unsigned int bit; + PhysTrackerL2 *dir2; + PhysTrackerL3 *dir3; + + ASSERT(tracker); + ASSERT(HostIF_VMLockIsHeld(tracker->vm)); + PHYSTRACK_MPN2IDX(mpn, p1, p2, p3); + ASSERT(p1 < PHYSTRACK_L1_ENTRIES); + + dir2 = tracker->dir[p1]; + if (!dir2) { + PANIC(); + } + dir3 = PHYSTRACK_GETL3(dir2, p2); + if (!dir3) { + PANIC(); + } + PHYSTRACK_GETL3POS(p3, pos, bit); + if (!(dir3->bits[pos] & bit)) { + PANIC(); + } + dir3->bits[pos] &= ~bit; +} + + +/* + *---------------------------------------------------------------------- + * + * PhysTrack_Test -- + * + * tests whether a page is being tracked + * + * Results: + * TRUE if the page is tracked + * FALSE otherwise + * + * Side effects: + * None. + * + *---------------------------------------------------------------------- + */ + +Bool +PhysTrack_Test(const PhysTracker *tracker, // IN + MPN mpn) // IN: MPN of page to be tested. +{ + unsigned int p1; + unsigned int p2; + unsigned int p3; + unsigned int pos; + unsigned int bit; + PhysTrackerL2 *dir2; + PhysTrackerL3 *dir3; + + ASSERT(tracker); + ASSERT(HostIF_VMLockIsHeld(tracker->vm)); + PHYSTRACK_MPN2IDX(mpn, p1, p2, p3); + if (p1 >= PHYSTRACK_L1_ENTRIES) { + return FALSE; + } + dir2 = tracker->dir[p1]; + if (!dir2) { + return FALSE; + } + dir3 = PHYSTRACK_GETL3(dir2, p2); + if (!dir3) { + return FALSE; + } + PHYSTRACK_GETL3POS(p3, pos, bit); + return (dir3->bits[pos] & bit) != 0; +} + + +/* + *---------------------------------------------------------------------- + * + * PhysTrack_GetNext -- + * + * Return next tracked page + * + * Results: + * MPN when some tracked page was found + * INVALID_MPN otherwise. + * + * Side effects: + * None. + * + *---------------------------------------------------------------------- + */ + +MPN +PhysTrack_GetNext(const PhysTracker *tracker, // IN + MPN mpn) // IN: MPN of page to be tracked. +{ + unsigned int p1; + unsigned int p2; + unsigned int p3; + + if (mpn == INVALID_MPN) { + mpn = 0; /* First iteration. */ + } else { + mpn++; /* We want the next MPN. 
*/ + } + PHYSTRACK_MPN2IDX(mpn, p1, p2, p3); + + ASSERT(tracker); + ASSERT(HostIF_VMLockIsHeld(tracker->vm)); + for (; p1 < PHYSTRACK_L1_ENTRIES; p1++) { + PhysTrackerL2 *dir2; + + dir2 = tracker->dir[p1]; + if (dir2) { + for (; p2 < PHYSTRACK_L2_ENTRIES; p2++) { + PhysTrackerL3 *dir3; + + dir3 = PHYSTRACK_GETL3(dir2, p2); + if (dir3) { + for (; p3 < PHYSTRACK_L3_ENTRIES; p3++) { + unsigned int pos; + unsigned int bit; + + PHYSTRACK_GETL3POS(p3, pos, bit); + if (dir3->bits[pos] & bit) { + return (p1 * PHYSTRACK_L2_ENTRIES + p2) * PHYSTRACK_L3_ENTRIES + p3; + } + } + } + p3 = 0; + } + } + p2 = 0; p3 = 0; + } + return INVALID_MPN; +} + diff --git a/vmmon-only/common/phystrack.h b/vmmon-only/common/phystrack.h new file mode 100644 index 00000000..e88c19a3 --- /dev/null +++ b/vmmon-only/common/phystrack.h @@ -0,0 +1,54 @@ +/********************************************************* + * Copyright (C) 1998 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * phystrack.h -- + * + * track down the utilization of the physical pages + */ + +#ifndef PHYSTRACK_H +#define PHYSTRACK_H + +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMCORE +#include "includeCheck.h" + +#if defined(WINNT_DDK) +/* XXX: can be more efficient based on server vs. desktop and version of Windows */ +#define PHYSTRACK_MAX_SUPPORTED_GB (2048 + 4) /* 2 TB 64-bit W2k8 + 4 GB PCI */ +#endif + +struct PhysTracker; +struct VMDriver; + +EXTERN struct PhysTracker *PhysTrack_Alloc(struct VMDriver *vm); +EXTERN void PhysTrack_Free(struct PhysTracker *); + +EXTERN void PhysTrack_Add(struct PhysTracker *, MPN); +EXTERN void PhysTrack_Remove(struct PhysTracker *, MPN); +EXTERN Bool PhysTrack_Test(const struct PhysTracker *, MPN); +EXTERN MPN PhysTrack_GetNext(const struct PhysTracker *, MPN); + +#endif + + + + + + diff --git a/vmmon-only/common/task.c b/vmmon-only/common/task.c new file mode 100644 index 00000000..de2429ef --- /dev/null +++ b/vmmon-only/common/task.c @@ -0,0 +1,2180 @@ +/********************************************************* + * Copyright (C) 1998-2016 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. 
+ * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * task.c -- + * + * Task initialization and switching routines between the host + * and the monitor. + * + * A task switch: + * -saves the EFLAGS,CR0,CR2,CR4, and IDT + * -jumps to code on the shared page + * which saves the registers, GDT and CR3 + * which then restores the registers, GDT and CR3 + * -restores the IDT,CR0,CR2,CR4 and EFLAGS + * + * This file is pretty much independent of the host OS. + * + */ + +#ifdef linux +/* Must come before any kernel header file --hpreg */ +# include "driver-config.h" +# include /* memset() in the kernel */ + +# define EXPORT_SYMTAB +#else +# include +#endif + +#include "vmware.h" +#include "modulecall.h" +#include "vmx86.h" +#include "task.h" +#include "vm_asm.h" +#include "cpuid.h" +#include "hostif.h" +/* On Linux, must come before any inclusion of asm/page.h --hpreg */ +#include "hostKernel.h" +#include "comport.h" +#include "crossgdt.h" +#include "x86svm.h" +#include "x86vt.h" +#include "x86vtinstr.h" +#include "apic.h" +#include "x86perfctr.h" + +#if defined(_WIN64) +# include "x86.h" +# include "vmmon-asm-x86-64.h" +# define USE_TEMPORARY_GDT 1 +#else +/* It is OK to set this to 1 on 64-bit Linux/Mac OS for testing. */ +# define USE_TEMPORARY_GDT 0 +#endif + +#define TS_ASSERT(t) do { \ + DEBUG_ONLY(if (!(t)) TaskAssertFail(__LINE__);) \ +} while (0) + +static CrossGDT *crossGDT = NULL; +static MPN crossGDTMPNs[CROSSGDT_NUMPAGES]; +static DTR crossGDTDescHKLA; +static Selector kernelStackSegment = 0; +static uint32 dummyLVT; +static Atomic_uint64 hvRootPage[MAX_PCPUS]; +static Atomic_Ptr tmpGDT[MAX_PCPUS]; +static Bool pebsAvailable = FALSE; + + +/* + *----------------------------------------------------------------------------- + * + * TaskAllocHVRootPage -- + * + * Allocate and initialize an HV root page. Upon success, race to be + * the first to store the allocated MPN in '*slot'. + * + * Results: + * None. + * + * Side effects: + * When the call returns, '*slot' contains the MPN of an HV root page if + * a thread succeeded, or INVALID_MPN if all threads failed. + * + *----------------------------------------------------------------------------- + */ + +static void +TaskAllocHVRootPage(Atomic_uint64 *slot) // IN/OUT +{ + uint32 *content; + uint64 vmxBasicMSR; + MPN mpn; + static const MPN invalidMPN = INVALID_MPN; + + ASSERT(slot != NULL); + + /* Allocate the page contents. */ + content = HostIF_AllocKernelMem(PAGE_SIZE, TRUE); + if (content == NULL) { + Warning("%s: Failed to allocate content.\n", __FUNCTION__); + return; + } + + /* + * On VMX-capable hardware, write the VMCS revision identifier at the + * beginning of the HV root page. On SVM-capable hardware, the HV root + * page is just initialized to zeroes. + */ + memset(content, 0, PAGE_SIZE); + if (HostIF_SafeRDMSR(MSR_VMX_BASIC, &vmxBasicMSR) == 0) { + *content = LODWORD(vmxBasicMSR); + } + + /* Allocate the HV root page. */ + mpn = HostIF_AllocMachinePage(); + + if (mpn != INVALID_MPN) { + /* + * Store the MPN of the HV root page. This is done atomically, so if + * several threads concurrently race and call TaskAllocHVRootPage() with + * the same 'slot', only the first one to pass this finish line will win. 
+ */ + if (HostIF_WriteMachinePage(mpn, PtrToVA64(content)) != 0 || + !Atomic_CMPXCHG64(slot, &invalidMPN, &mpn)) { + /* + * Either we couldn't set up the page or this thread lost the race. + * We must free its HV root page. + */ + Warning("%s: Failed to setup page mpn=%llx.\n", + __FUNCTION__, (long long unsigned)mpn); + HostIF_FreeMachinePage(mpn); + } + } else { + Warning("%s: Failed to allocate page.\n", __FUNCTION__); + } + + HostIF_FreeKernelMem(content); +} + + +/* + *----------------------------------------------------------------------------- + * + * TaskGetHVRootPage -- + * + * Lazily allocate an HV root page, and return its MPN. + * + * Results: + * On success: The MPN of the HV root page. + * On failure: INVALID_MPN. + * + * Side effects: + * Might allocate memory, and transition '*slot' from + * INVALID_MPN to a valid MPN. + * + *----------------------------------------------------------------------------- + */ + +static MPN +TaskGetHVRootPage(Atomic_uint64 *slot) // IN/OUT +{ + MPN mpn = Atomic_Read64(slot); + + if (mpn != INVALID_MPN) { + return mpn; + } + + TaskAllocHVRootPage(slot); + + return Atomic_Read64(slot); +} + + +/* + *----------------------------------------------------------------------------- + * + * Task_GetHVRootPageForPCPU -- + * + * Lazily allocate the HV root page for a pCPU, and return its MPN. + * This is used for the VMXON region on Intel/VIA hardware and the + * host save area on AMD hardware. + * + * Results: + * On success: The MPN of the HV root page. + * On failure: INVALID_MPN. + * + * Side effects: + * Might allocate memory, and transition 'hvRootPage[pCPU]' from + * INVALID_MPN to a valid MPN. + * + *----------------------------------------------------------------------------- + */ + +MPN +Task_GetHVRootPageForPCPU(uint32 pCPU) // IN +{ + ASSERT(pCPU < ARRAYSIZE(hvRootPage)); + + return TaskGetHVRootPage(&hvRootPage[pCPU]); +} + + +/* + *----------------------------------------------------------------------------- + * + * TaskAllocGDT -- + * + * Allocate a GDT. Upon success, race to be the first to store its base in + * '*slot'. + * + * Results: + * None. + * + * Side effects: + * When the call returns, '*slot' contains the base of a GDT if a thread + * succeeded, or NULL if all threads failed. + * + *----------------------------------------------------------------------------- + */ + +static void +TaskAllocGDT(Atomic_Ptr *slot) // IN/OUT +{ + Descriptor *base; + + ASSERT(slot); + + /* Allocate a GDT. */ + base = HostIF_AllocKernelMem(0x10000 /* Maximal GDT size */, TRUE); + if (!base) { + Warning("%s: Failed to allocate temporary GDT.\n", __FUNCTION__); + return; + } + + /* + * Store the base of the GDT. This is done atomically, so if several threads + * concurrently race and call TaskAllocGDT() with the same 'slot', only the + * first one to pass this finish line will win. + */ + + if (Atomic_ReadIfEqualWritePtr(slot, NULL, base)) { + /* This thread lost the race. It must free its GDT. */ + HostIF_FreeKernelMem(base); + } +} + + +/* + *----------------------------------------------------------------------------- + * + * TaskGetGDT -- + * + * Lazily allocate a GDT, and return its base. + * + * Results: + * On success: The base of the GDT. + * On failure: NULL. + * + * Side effects: + * Might allocate memory, and transition '*slot' from NULL to a valid + * base. 
+ * + *----------------------------------------------------------------------------- + */ + +static Descriptor * +TaskGetGDT(Atomic_Ptr *slot) // IN/OUT +{ + Descriptor *base = Atomic_ReadPtr(slot); + + if (base) { + return base; + } + + TaskAllocGDT(slot); + + return Atomic_ReadPtr(slot); +} + + +/* + *----------------------------------------------------------------------------- + * + * Task_GetTmpGDT -- + * + * Lazily allocate the temporary GDT for a pCPU, and return its base. + * + * Results: + * On success: The base of the temporary GDT. + * On failure: NULL. + * + * Side effects: + * Might allocate memory, and transition 'tmpGDT[pCPU]' from NULL to a + * valid base. + * + *----------------------------------------------------------------------------- + */ + +Descriptor * +Task_GetTmpGDT(uint32 pCPU) // IN +{ + ASSERT(pCPU < ARRAYSIZE(tmpGDT)); + + return TaskGetGDT(&tmpGDT[pCPU]); +} + + +/* + *----------------------------------------------------------------------------- + * + * TaskFreeHVRootPages -- + * + * Free all HV root pages (allocated by TaskAllocHVRootPage), if any. + * + * Results: + * None. + * + * Side effects: + * None. + * + *----------------------------------------------------------------------------- + */ + +static void +TaskFreeHVRootPages(void) +{ + MPN mpn; + unsigned i; + + for (i = 0; i < ARRAYSIZE(hvRootPage); i++) { + mpn = Atomic_Read64(&hvRootPage[i]); + if (mpn != INVALID_MPN) { + HostIF_FreeMachinePage(mpn); + } + } +} + + +#ifdef VMX86_DEBUG +/* + *----------------------------------------------------------------------------- + * + * TaskAssertFail -- + * + * Output line number to comport and crash. + * + *----------------------------------------------------------------------------- + */ + +static void +TaskAssertFail(int line) +{ + CP_PutStr("TaskAssertFail*: "); + CP_PutDec(line); + CP_PutCrLf(); + SET_CR3(0); +} + + +#endif +/* + *----------------------------------------------------------------------------- + * + * TaskSaveGDT64 -- + * + * Save the current GDT in the caller-supplied struct. + * + * Results: + * *hostGDT64 = copy of the processor's GDT. + * + * Side effects: + * None. + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +TaskSaveGDT64(DTR64 *hostGDT64) // OUT +{ + hostGDT64->offset = 0; + _Get_GDT((DTR *)hostGDT64); +} + + +/* + *----------------------------------------------------------------------------- + * + * TaskSaveIDT64 -- + * + * Save the current IDT in the caller-supplied struct. + * + * Results: + * *hostIDT64 = copy of the processor's IDT. + * + * Side effects: + * None. + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +TaskSaveIDT64(DTR64 *hostIDT64) // OUT +{ + hostIDT64->offset = 0; + _Get_IDT((DTR *)hostIDT64); +} + + +/* + *----------------------------------------------------------------------------- + * + * TaskLoadIDT64 -- + * + * Load the current IDT from the caller-supplied struct. + * + * Results: + * Processor's IDT = *hostIDT64. + * + * Side effects: + * None. + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +TaskLoadIDT64(DTR64 *hostIDT64) // IN +{ + _Set_IDT((DTR *)hostIDT64); +} + + +/* + *----------------------------------------------------------------------------- + * + * TaskCopyGDT64 -- + * + * Copy the given GDT contents to the caller-supplied buffer. 
+ * + * This routine assumes the caller has already verified there is enough + * room in the output buffer. + * + * Results: + * *out = copy of the processor's GDT contents. + * + * Side effects: + * None. + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +TaskCopyGDT64(DTR64 *hostGDT64, // IN GDT to be copied from + Descriptor *out) // OUT where to copy contents to +{ + memcpy(out, + (void *)HOST_KERNEL_LA_2_VA((LA)hostGDT64->offset), + hostGDT64->limit + 1); +} + + +/* + *----------------------------------------------------------------------------- + * + * Task_Terminate -- + * + * Called at driver unload time. Undoes whatever Task_Initialize did. + * + * Results: + * None. + * + * Side effects: + * Release temporary GDT memory. + * + *----------------------------------------------------------------------------- + */ + +void +Task_Terminate(void) +{ + TaskFreeHVRootPages(); + + if (crossGDT != NULL) { + HostIF_FreeCrossGDT(CROSSGDT_NUMPAGES, crossGDT); + crossGDT = NULL; + crossGDTDescHKLA.limit = 0; + crossGDTDescHKLA.offset = 0; + } + + if (USE_TEMPORARY_GDT) { + unsigned i; + + for (i = 0; i < ARRAYSIZE(tmpGDT); i++) { + Descriptor *base = Atomic_ReadPtr(&tmpGDT[i]); + + if (base) { + HostIF_FreeKernelMem(base); + } + } + } +} + + +/* + *----------------------------------------------------------------------------- + * + * Task_Initialize -- + * + * Called at driver load time to initialize module's static data. + * + * Results: + * TRUE iff initialization successful. + * + * Side effects: + * None. + * + *----------------------------------------------------------------------------- + */ + +Bool +Task_Initialize(void) +{ + unsigned i; + + ASSERT_ON_COMPILE(sizeof (Atomic_uint64) == sizeof (MPN)); + for (i = 0; i < ARRAYSIZE(hvRootPage); i++) { + Atomic_Write64(&hvRootPage[i], INVALID_MPN); + } + if (USE_TEMPORARY_GDT) { + for (i = 0; i < ARRAYSIZE(tmpGDT); i++) { + Atomic_WritePtr(&tmpGDT[i], NULL); + } + } + + /* + * The worldswitch code doesn't work with a zero stack segment + * because it temporarily restores the data segments to the stack + * segment. So here we make sure we have a non-zero kernel + * read/write flat data segment. + */ + + kernelStackSegment = GET_SS(); + if (kernelStackSegment == 0) { + DTR hostGDTR; + + GET_GDT(hostGDTR); + for (kernelStackSegment = 8; + kernelStackSegment + 7 <= hostGDTR.limit; + kernelStackSegment += 8) { + uint64 gdte = *(uint64 *)(hostGDTR.offset + kernelStackSegment); + + if ((gdte & 0xFFCFFEFFFFFFFFFFULL) == 0x00CF92000000FFFFULL) { + goto gotnzss; + } + } + Warning("%s: no non-null flat kernel data GDT segment\n", + __FUNCTION__); + + return FALSE; +gotnzss:; + } + if ((kernelStackSegment == 0) || ((kernelStackSegment & 7) != 0)) { + Warning("Task_Initialize: unsupported SS %04x\n", + kernelStackSegment); + return FALSE; + } + + /* + * Check if PEBS is supported. For simplicity we assume there will not + * be mixed CPU models. According to the Intel SDM, PEBS is supported if: + * + * IA32_MISC_ENABLE.EMON_AVAILABE (bit 7) is set and + * IA32_MISC_ENABLE.PEBS_UNAVAILABE (bit 12) is clear. + */ + + pebsAvailable = PerfCtr_PEBSAvailable(); + return TRUE; +} + + +/* + *----------------------------------------------------------------------------- + * + * TaskRestoreHostGDTTRLDT -- + * + * + * Results: + * The host's GDT is copied (or partially copied) to the + * dynamically allocated temporary GDT. 
+ * + * The TR is restored using the temporary GDT then the host's real GDT is + * restored. Finally, the host LDT is restored. + * + * Notes: + * An OS which checks critical data structures, such as the GDT, + * can fail when this module changes the TSS busy bit in the host + * GDT. To avoid this problem, we use a sparse copy of the host + * GDT to perform the manipulation of the TSS busy bit. + * + * See PR 68144. + * + *----------------------------------------------------------------------------- + */ + +static INLINE_SINGLE_CALLER void +TaskRestoreHostGDTTRLDT(Descriptor *tempGDTBase, + DTR64 hostGDT64, + Selector ldt, + Selector cs, + Selector tr) +{ + TS_ASSERT(tr != 0); + TS_ASSERT((tr & 7) == 0); + + if (USE_TEMPORARY_GDT) { + DTR64 tempGDT64; + + /* + * Set up a temporary GDT so that the TSS 'busy bit' can be + * changed without affecting the host's data structures. + */ + + const VA hostGDTVA = HOST_KERNEL_LA_2_VA(hostGDT64.offset); + const unsigned size = sizeof(Descriptor); + const Selector ss = SELECTOR_CLEAR_RPL(GET_SS()); + + ASSERT(hostGDTVA == HOST_KERNEL_LA_2_VA(hostGDT64.offset)); + + ASSERT(SELECTOR_RPL(cs) == 0 && SELECTOR_TABLE(cs) == 0); + ASSERT(SELECTOR_RPL(ss) == 0 && SELECTOR_TABLE(ss) == 0); + + /* + * Copy code and data segments so they remain valid in case of NMI. + * Worldswitch code returns with DS==ES==SS so we don't have to set + * up DS,ES explicitly. + */ + + ASSERT(SELECTOR_CLEAR_RPL(GET_DS()) == ss); + ASSERT(SELECTOR_CLEAR_RPL(GET_ES()) == ss); + tempGDTBase[cs / size] = *(Descriptor *)(hostGDTVA + cs); + tempGDTBase[ss / size] = *(Descriptor *)(hostGDTVA + ss); + + /* + * TR descriptors use two entries (64-bits wide) in 64-bit mode. + */ + + tempGDTBase[tr / size] = *(Descriptor *)(hostGDTVA + tr); + tempGDTBase[tr / size + 1] = *(Descriptor *)(hostGDTVA + tr + size); + + /* + * Clear the 'task busy' bit so we can reload TR. + */ + + if (Desc_Type(&tempGDTBase[tr / size]) == TASK_DESC_BUSY) { + Desc_SetType(&tempGDTBase[tr / size], TASK_DESC); + } + + /* + * Restore the TR using the temp GDT then restore the host's real GDT + * then host LDT. + */ + + tempGDT64.limit = hostGDT64.limit; + tempGDT64.offset = HOST_KERNEL_VA_2_LA((VA)tempGDTBase); + _Set_GDT((DTR *)&tempGDT64); + SET_TR(tr); + _Set_GDT((DTR *)&hostGDT64); + SET_LDT(ldt); + } else { + Descriptor *desc; + + /* + * The host isn't picky about the TR entry. So clear the TSS bit + * in the host GDT, then restore host GDT and TR, then LDT. + */ + + desc = (Descriptor *)((VA)HOST_KERNEL_LA_2_VA(hostGDT64.offset + tr)); + if (Desc_Type(desc) == TASK_DESC_BUSY) { + Desc_SetType(desc, TASK_DESC); + } + _Set_GDT((DTR *)&hostGDT64); + SET_TR(tr); + SET_LDT(ldt); + } +} + + +/* + *----------------------------------------------------------------------------- + * + * Task_AllocCrossGDT -- + * + * Make sure the crossGDT is allocated and initialized. + * + * Results: + * TRUE iff crossGDT was already initialized or successfully initialized. + * + * Side effects: + * crossGDT static vars set up if not already. + * + *----------------------------------------------------------------------------- + */ + +Bool +Task_AllocCrossGDT(InitBlock *initBlock) // OUT: crossGDT values filled in +{ + DTR64 hostGDT64; + + /* + * Make sure only one of these runs at a time on the whole system, because + * there is only one crossGDT for the whole system. + */ + + HostIF_GlobalLock(2); + + /* + * Maybe the crossGDT has already been set up. 
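[Editorial note: TaskRestoreHostGDTTRLDT below clears the TSS descriptor's "busy" type so TR can be reloaded. The following is a standalone sketch of that bit manipulation on a raw descriptor qword, assuming the standard x86-64 system-descriptor layout (4-bit type field in bits 43:40, 0x9 = 64-bit TSS available, 0xB = busy); DescClearTssBusy is an illustrative name, not the driver's Desc_* API.]

#include <assert.h>
#include <stdint.h>

#define DESC_TYPE_SHIFT 40
#define DESC_TYPE_MASK  (0xFULL << DESC_TYPE_SHIFT)
#define TSS64_AVAIL     0x9ULL
#define TSS64_BUSY      0xBULL

/* Extract the 4-bit system-descriptor type (bits 43:40 of the low qword). */
static inline unsigned
DescType(uint64_t descLo)
{
   return (unsigned)((descLo & DESC_TYPE_MASK) >> DESC_TYPE_SHIFT);
}

/* Rewrite a busy 64-bit TSS descriptor as available so LTR will accept it. */
static inline uint64_t
DescClearTssBusy(uint64_t descLo)
{
   if (DescType(descLo) == TSS64_BUSY) {
      descLo = (descLo & ~DESC_TYPE_MASK) | (TSS64_AVAIL << DESC_TYPE_SHIFT);
   }
   return descLo;
}

int
main(void)
{
   uint64_t busy = (TSS64_BUSY << DESC_TYPE_SHIFT) | (1ULL << 47); /* P=1 */
   assert(DescType(DescClearTssBusy(busy)) == TSS64_AVAIL);
   return 0;
}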
+ */ + + if (crossGDT == NULL) { + MPN maxValidFirst = + 0xFFC00 /* 32-bit MONITOR_LINEAR_START */ - CROSSGDT_NUMPAGES; + + /* + * The host entries must fit on pages of the crossGDT that are mapped. + * Since we know they are below CROSSGDT_LOWSEG, we can just check that + * CROSSGDT_LOWSEG and below are mapped. + * + * Because the CROSSGDT_LOWSEG segments must reside on the first page of + * the crossGDT (as they must remain valid with paging off), all we need + * do is check that bit 0 of CROSSGDT_PAGEMASK is set (indicating that + * page 0 of the crossGDT will be mapped). + */ + + ASSERT_ON_COMPILE(CROSSGDT_LOWSEG < PAGE_SIZE); + ASSERT_ON_COMPILE(CROSSGDT_PAGEMASK & 1); + + /* + * Allocate the crossGDT. + */ + ASSERT_ON_COMPILE(sizeof *crossGDT == CROSSGDT_NUMPAGES * PAGE_SIZE); + crossGDT = HostIF_AllocCrossGDT(CROSSGDT_NUMPAGES, maxValidFirst, + crossGDTMPNs); + if (crossGDT == NULL) { + HostIF_GlobalUnlock(2); + Warning("%s: unable to allocate crossGDT\n", __FUNCTION__); + + return FALSE; + } + + /* + * Check that the crossGDT meets the address requirements documented in + * bora/doc/worldswitch-pages.txt. + */ + + if (crossGDTMPNs[0] > maxValidFirst) { + HostIF_FreeCrossGDT(CROSSGDT_NUMPAGES, crossGDT); + crossGDT = NULL; + HostIF_GlobalUnlock(2); + Warning("%s: crossGDT MPN %"FMT64"X gt %"FMT64"X\n", __FUNCTION__, + crossGDTMPNs[0], maxValidFirst); + + return FALSE; + } + + /* + * Fill the crossGDT with a copy of our host GDT. VMX will have to fill + * in monitor segments via Task_InitCrossGDT. + * + * We are assuming that all the host segments we will ever need are below + * CROSSGDT_LOWSEG. If this assumption ever breaks, the host segments + * would have to be unconditionally transitioned to the CROSSGDT + * intermediate segments before switching to the monitor. The only time + * the GDT has been found to be bigger than CROSSGDT_LOWSEG is when they + * are running KVM or Xen, and we never see the large segment numbers. + */ + + memset(crossGDT, 0, sizeof *crossGDT); + TaskSaveGDT64(&hostGDT64); + if (hostGDT64.limit > CROSSGDT_LOWSEG * 8 - 1) { + hostGDT64.limit = CROSSGDT_LOWSEG * 8 - 1; + } + TaskCopyGDT64(&hostGDT64, crossGDT->gdtes); + + /* + * Set up descriptor for the crossGDT using host kernel LA as a base. + */ + + crossGDTDescHKLA.limit = sizeof *crossGDT - 1; + crossGDTDescHKLA.offset = HOST_KERNEL_VA_2_LA((VA)crossGDT); + } + + HostIF_GlobalUnlock(2); + + initBlock->crossGDTHKLA = crossGDTDescHKLA.offset; + ASSERT_ON_COMPILE(sizeof initBlock->crossGDTMPNs == sizeof crossGDTMPNs); + memcpy(initBlock->crossGDTMPNs, crossGDTMPNs, sizeof crossGDTMPNs); + + return TRUE; +} + + +/* + *----------------------------------------------------------------------------- + * + * Task_InitCrosspage -- + * + * Initialize the crosspage used to switch to the monitor task. 
+ * + * Results: + * 0 on success + * != 0 on failure + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +int +Task_InitCrosspage(VMDriver *vm, // IN + InitBlock *initParams) // IN/OUT: Initial params from the + // VM +{ + Vcpuid vcpuid; + + if (crossGDT == NULL) { + return 1; + } + + initParams->crossGDTHKLA = crossGDTDescHKLA.offset; + ASSERT_ON_COMPILE(sizeof initParams->crossGDTMPNs == sizeof crossGDTMPNs); + memcpy(initParams->crossGDTMPNs, crossGDTMPNs, sizeof crossGDTMPNs); + + for (vcpuid = 0; vcpuid < initParams->numVCPUs; vcpuid++) { + VA64 crossPageUserAddr = initParams->crosspage[vcpuid]; + VMCrossPage *p = HostIF_MapCrossPage(vm, crossPageUserAddr); + MPN crossPageMPN; + + if (p == NULL) { + return 1; + } + + if (HostIF_LookupUserMPN(vm, crossPageUserAddr, &crossPageMPN) != + PAGE_LOOKUP_SUCCESS || + crossPageMPN == 0) { + return 1; + } + + { + /* The version of the crosspage must be the first four + * bytes of the crosspage. See the declaration + * of VMCrossPage in modulecall.h. + */ + + ASSERT_ON_COMPILE(offsetof(VMCrossPage, version) == 0); + ASSERT_ON_COMPILE(sizeof(p->version) == sizeof(uint32)); + + /* p->version is VMX's version; CROSSPAGE_VERSION is vmmon's. */ + if (p->version != CROSSPAGE_VERSION) { + Warning("%s: crosspage version mismatch: vmmon claims %#x, must " + "match vmx version of %#x.\n", __FUNCTION__, + (int)CROSSPAGE_VERSION, p->version); + return 1; + } + } + { + /* The following constants are the size and offset of the + * VMCrossPage->crosspage_size field as defined by the + * vmm/vmx. + */ + + ASSERT_ON_COMPILE(offsetof(VMCrossPage, crosspage_size) == + sizeof(uint32)); + ASSERT_ON_COMPILE(sizeof(p->crosspage_size) == sizeof(uint32)); + + if (p->crosspage_size != sizeof(VMCrossPage)) { + Warning("%s: crosspage size mismatch: vmmon claims %#x bytes, " + "must match vmm size of %#x bytes.\n", __FUNCTION__, + (unsigned)sizeof(VMCrossPage), p->crosspage_size); + return 1; + } + } + + if (crossPageMPN > MA_2_MPN(0xFFFFFFFF)) { + Warning("%s*: crossPageMPN 0x%016" FMT64 "x invalid\n", __FUNCTION__, + crossPageMPN); + return 1; + } + if (!pseudoTSC.initialized) { + Warning("%s*: PseudoTSC has not been initialized\n", __FUNCTION__); + return 1; + } + p->crosspageData.crosspageMA = (uint32)MPN_2_MA(crossPageMPN); + p->crosspageData.hostCrossPageLA = (LA64)(uintptr_t)p; + + /* + * Pass our kernel code segment numbers back to MonitorPlatformInit. + * They have to be in the GDT so they will be valid when the crossGDT is + * active. + */ + + p->crosspageData.hostInitial64CS = GET_CS(); + TS_ASSERT(SELECTOR_RPL (p->crosspageData.hostInitial64CS) == 0 && + SELECTOR_TABLE(p->crosspageData.hostInitial64CS) == 0); + + p->crosspageData.moduleCallInterrupted = FALSE; + p->crosspageData.pseudoTSCConv.p.mult = 1; + p->crosspageData.pseudoTSCConv.p.shift = 0; + p->crosspageData.pseudoTSCConv.p.add = 0; + p->crosspageData.pseudoTSCConv.changed = TRUE; + p->crosspageData.worldSwitchPTSC = Vmx86_GetPseudoTSC(); + p->crosspageData.timerIntrTS = MAX_ABSOLUTE_TS; + p->crosspageData.hstTimerExpiry = MAX_ABSOLUTE_TS; + p->crosspageData.monTimerExpiry = MAX_ABSOLUTE_TS; + vm->crosspage[vcpuid] = p; + } + + return 0; +} + + +/* + *----------------------------------------------------------------------------- + * + * Task_InitCrossGDT -- + * + * Fill in a crossGDT entry from the given template. + * + * Results: + * 0 on success + * != 0 on failure + * + * Side effects: + * CrossGDT entry filled from template. 
If crossGDT has already been + * initialized, the entry is compared to the given template. Any + * discrepancy is logged and an error is returned. This is necessary + * because this same GDT is shared among all VMs on this host, so really, + * the first call initializes it and the others just do compares. + * + *----------------------------------------------------------------------------- + */ + +int +Task_InitCrossGDT(InitCrossGDT *initCrossGDT) // IN +{ + Descriptor v; + int rc; + uint32 i; + + rc = 1; + i = initCrossGDT->index; + v = initCrossGDT->value; + + HostIF_GlobalLock(3); + if (i >= sizeof crossGDT->gdtes / sizeof crossGDT->gdtes[0]) { + HostIF_GlobalUnlock(3); + Warning("%s: index %u too big\n", __FUNCTION__, i); + } else if (!( (1 << (i * sizeof crossGDT->gdtes[0] / PAGE_SIZE)) + & CROSSGDT_PAGEMASK)) { + HostIF_GlobalUnlock(3); + Warning("%s: index %u not in CROSSGDT_PAGEMASK %x\n", __FUNCTION__, + i, CROSSGDT_PAGEMASK); + } else if (!Desc_Present(&v)) { + HostIF_GlobalUnlock(3); + Warning("%s: entry %u not present\n", __FUNCTION__, i); + } else if (!Desc_Present(crossGDT->gdtes + i)) { + crossGDT->gdtes[i] = v; + HostIF_GlobalUnlock(3); + rc = 0; + } else if (Desc_EqualIgnoreAccessed(crossGDT->gdtes + i, &v)) { + HostIF_GlobalUnlock(3); + rc = 0; + } else { + HostIF_GlobalUnlock(3); + Warning("%s: entry 0x%X mismatch\n", __FUNCTION__, i); + Warning("%s: crossGDT %16.16llX\n", __FUNCTION__, + (long long unsigned)*(uint64 *)(crossGDT->gdtes + i)); + Warning("%s: template %16.16llX\n", __FUNCTION__, + (long long unsigned)*(uint64 *)&v); + } + + return rc; +} + + +/* + *----------------------------------------------------------------------------- + * + * Disable and restore APIC NMI delivery. + * + *----------------------------------------------------------------------------- + */ + +static Bool +TaskDisableNMIDelivery(const APICDescriptor *desc, // IN + int regNum) // IN +{ + uint32 reg = APIC_Read(desc, regNum); + + if (APIC_LVT_DELVMODE(reg) == APIC_LVT_DELVMODE_NMI && + !APIC_LVT_ISMASKED(reg)) { + APIC_Write(desc, regNum, reg | APIC_LVT_MASK); + // Force completion of masking (was bug 78470). + dummyLVT = APIC_Read(desc, regNum); + return TRUE; + } + + return FALSE; +} + + +static void +TaskDisableNMI(const APICDescriptor *desc, // IN + Bool *lint0NMI, // OUT + Bool *lint1NMI, // OUT + Bool *pcNMI, // OUT + Bool *thermalNMI) // OUT +{ + if (desc->base || desc->isX2) { + *lint0NMI = TaskDisableNMIDelivery(desc, APICR_LVT0); + *lint1NMI = TaskDisableNMIDelivery(desc, APICR_LVT1); + *pcNMI = TaskDisableNMIDelivery(desc, APICR_PCLVT); + + /* + * The LVT thermal monitor register was introduced + * in Pentium 4 and Xeon processors. 
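[Editorial note: TaskDisableNMIDelivery below masks an LVT entry and reads it back to force the write to complete. This is a generic sketch of that read-modify-write-and-readback pattern on a memory-mapped 32-bit register; the register pointer, MaskIfUnmasked, and REG_MASK_BIT are hypothetical, not the driver's APIC accessors.]

#include <stdbool.h>
#include <stdint.h>

#define REG_MASK_BIT (1u << 16)   /* hypothetical 'masked' bit, in the spirit of APIC_LVT_MASK */

/*
 * Mask the interrupt controlled by *reg if it is currently unmasked.
 * Returns true iff this call changed the register, so the caller knows
 * whether to unmask it again on the restore path.
 */
static bool
MaskIfUnmasked(volatile uint32_t *reg)
{
   uint32_t val = *reg;
   if ((val & REG_MASK_BIT) != 0) {
      return false;               /* already masked; nothing to undo later */
   }
   *reg = val | REG_MASK_BIT;
   (void)*reg;                    /* read back to force completion of the masking write */
   return true;
}

int
main(void)
{
   uint32_t fakeReg = 0;          /* stands in for a mapped LVT register */
   bool changed = MaskIfUnmasked(&fakeReg);
   return (changed && (fakeReg & REG_MASK_BIT)) ? 0 : 1;
}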
+ */ + + if (APIC_MaxLVT(desc) >= 5) { + *thermalNMI = TaskDisableNMIDelivery(desc, APICR_THERMLVT); + } else { + *thermalNMI = FALSE; + } + } else { + *lint0NMI = FALSE; + *lint1NMI = FALSE; + *pcNMI = FALSE; + *thermalNMI = FALSE; + } +} + + +static void +TaskRestoreNMIDelivery(const APICDescriptor *desc, // IN + Bool restore, // IN + int regNum) // IN +{ + if (restore) { + uint32 reg = APIC_Read(desc, regNum); + + APIC_Write(desc, regNum, reg & ~APIC_LVT_MASK); + } +} + + +static void +TaskRestoreNMI(const APICDescriptor *desc, // IN + Bool lint0NMI, // IN + Bool lint1NMI, // IN + Bool pcNMI, // IN + Bool thermalNMI) // IN +{ + TaskRestoreNMIDelivery(desc, lint0NMI, APICR_LVT0); + TaskRestoreNMIDelivery(desc, lint1NMI, APICR_LVT1); + TaskRestoreNMIDelivery(desc, pcNMI, APICR_PCLVT); + TaskRestoreNMIDelivery(desc, thermalNMI, APICR_THERMLVT); +} + + +/* + *----------------------------------------------------------------------------- + * + * TaskEnableTF -- + * + * Turn on EFLAGS. + * + * Results: + * None. + * + * Side effects: + * Trace trapping enabled. + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +TaskEnableTF(void) +{ +#if defined(__GNUC__) + asm volatile ("pushfq ; orb $1,1(%rsp) ; popfq"); +#elif defined(_MSC_VER) + __writeeflags(__readeflags() | EFLAGS_TF); +#else +#error no compiler support for setting TF +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * TaskDisableTF -- + * + * Turn off EFLAGS. + * + * Results: + * None. + * + * Side effects: + * Trace trapping disabled. + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +TaskDisableTF(void) +{ +#if defined(__GNUC__) + asm volatile ("pushfq ; andb $~1,1(%rsp) ; popfq"); +#elif defined(_MSC_VER) + __writeeflags(__readeflags() & ~EFLAGS_TF); +#else +#error no compiler support for clearing TF +#endif +} + + +static INLINE Bool +TaskGotException(const VMCrossPage *crosspage, unsigned exc) +{ + return crosspage->crosspageCode.faultHandler.wsException[exc]; +} + + +static INLINE void +TaskSetException(VMCrossPage *crosspage, unsigned exc, Bool v) +{ + crosspage->crosspageCode.faultHandler.wsException[exc] = v; +} + + +/* + *----------------------------------------------------------------------------- + * + * TaskSaveDebugRegisters -- + * + * Save debug registers in the host context area of the crosspage. + * + * Results: + * None. + * + * Side effects: + * crosspage->hostDR[*] = some filled with debug register contents + * hostDRSaved = bits set for those we wrote to hostDR[*] array + * hostDRInHW = bits set indicating which hardware DR contents + * still match what the host wants + * hardware DR7 = 0 + * hardware DR7 = 0 + * + *----------------------------------------------------------------------------- + */ + +static INLINE_SINGLE_CALLER void +TaskSaveDebugRegisters(VMCrossPage *crosspage) +{ + Bool saveGotDB; + +#define SAVE_DR(n) \ + do { \ + uintptr_t drReg; \ + GET_DR##n(drReg); \ + crosspage->crosspageData.hostDR[n] = drReg; \ + } while (0) + + /* Hardware contains the host's %dr7, %dr6, %dr3, %dr2, %dr1, %dr0 */ + crosspage->crosspageData.hostDRInHW = ((1 << 7) | (1 << 6) | + (1 << 3) | (1 << 2) | + (1 << 1) | (1 << 0)); + + /* + * Save DR7 since we need to disable debug breakpoints during the world + * switch code. We will get a #DB if DR7 is set, but the + * SwitchDBHandler simply IRETs after setting crosspage gotDB flag. 
+ */ + + saveGotDB = TaskGotException(crosspage, EXC_DB); + TaskSetException(crosspage, EXC_DB, FALSE); + COMPILER_MEM_BARRIER(); /* Prevent hoisting #UD-raising instructions. */ + SAVE_DR(7); + + /* + * In all cases, DR7 shouldn't have the GD bit set. + */ + + TS_ASSERT(!(crosspage->crosspageData.hostDR[7] & DR7_GD)); + + /* + * Save DR6 in order to accommodate the ICEBP instruction and other stuff + * that can modify DR6 bits (trace traps, task switch traps, any others?). + */ + + SAVE_DR(6); + + /* + * It may be that DR7 had the GD bit set, in which case the + * crosspage exception[EXC_DB] flag would have just been set and + * DR6 will be set. If so, fix the saved values to look like + * they were when DR7 was set (before we tripped the #DB), so + * they'll get restored to what they were. Then make sure + * breakpoints are disabled during switch. + * + * Note that I am assuming DR6_BD was clear before the #DB and so + * I'm clearing it here. If it was set, we will end up restoring + * it cleared, but there's no way to tell. Someone suggested that + * ICEBP would tell us but it may also clear DR6<3:0>. + * + * SAVE_DR(6) can raise #DB. + */ + + if (TaskGotException(crosspage, EXC_DB) && + (crosspage->crosspageData.hostDR[6] & DR6_BD)) { + crosspage->crosspageData.hostDR[6] -= DR6_BD; + crosspage->crosspageData.hostDR[7] |= DR7_GD; + SET_DR7(DR7_DEFAULT); + + /* HW: %dr7 and %dr6 are the guest, %dr3, %dr2, %dr1, %dr0 are host */ + crosspage->crosspageData.hostDRInHW = ((1 << 3) | (1 << 2) | + (1 << 1) | (1 << 0)); + } + + /* + * No GD bit, check for enabled breakpoints. Disable them as they may + * coincidentally trip during the switch. + */ + + else if (crosspage->crosspageData.hostDR[7] & DR7_ENABLED) { + SET_DR7(DR7_DEFAULT); // no #DB here, just simple set + /* HW: %dr7 = guest, %dr6, %dr3, %dr2, %dr1, %dr0 = host */ + crosspage->crosspageData.hostDRInHW = ((1 << 6) | (1 << 3) | (1 << 2) | + (1 << 1) | (1 << 0)); + } + + TaskSetException(crosspage, EXC_DB, saveGotDB); + + /* + * hostDR[6,7] have host contents in them now. + */ + + crosspage->crosspageData.hostDRSaved = 0xC0; +#undef SAVE_DR +} + + +/* + *----------------------------------------------------------------------------- + * + * TaskRestoreDebugRegisters -- + * + * Put the debug registers back the way they were when + * TaskSaveDebugRegisters was called. + * + * Results: + * None. + * + * Side effects: + * Debug registers restored from values saved in the crosspage. + * + *----------------------------------------------------------------------------- + */ + +static INLINE_SINGLE_CALLER void +TaskRestoreDebugRegisters(VMCrossPageData *crosspage) +{ +#define RESTORE_DR(n) \ + if ((crosspage->hostDRInHW & (1 << n)) == 0) { \ + /* Guest value for register 'n' in hardware. */ \ + const uintptr_t drReg = (uintptr_t)crosspage->hostDR[n]; \ + if (!(crosspage->shadowDRInHW & (1 << n)) || \ + (drReg != SHADOW_DR(crosspage, n))) { \ + SET_DR##n(drReg); \ + } \ + } + + RESTORE_DR(0); + RESTORE_DR(1); + RESTORE_DR(2); + RESTORE_DR(3); + RESTORE_DR(6); + + /* + * DR7 must be restored last in case DR7 is set. + */ + RESTORE_DR(7); +#undef RESTORE_DR +} + + +/* + *----------------------------------------------------------------------------- + * + * TaskUpdateLatestPTSC -- + * + * Record the per-VM latest visible PTSC value, and indicate that + * this thread is no longer running in the VMM. See + * TaskUpdatePTSCParameters. + * + * Results: + * None. 
+ * + * Side effects: + * May update the latest PTSC value and the PTSC offset reference count. + * + *----------------------------------------------------------------------------- + */ + +static INLINE_SINGLE_CALLER void +TaskUpdateLatestPTSC(VMDriver *vm, VMCrossPageData *crosspage) +{ + if (Vmx86_HwTSCsSynced()) { + uint64 latest; + /* + * Determine a conservative estimate for the last PTSC value the + * VMM may have used. We can't just use + * crosspage->worldSwitchPTSC since some callees of BackToHost + * will compute their own PTSC (or infer a PTSC value from the + * TSC). + */ + uint64 ptsc = RDTSC() + crosspage->pseudoTSCConv.p.add; + do { + latest = Atomic_Read64(&vm->ptscLatest); + if (ptsc <= latest) { + break; + } + } while (!Atomic_CMPXCHG64(&vm->ptscLatest, &latest, &ptsc)); + /* After updating the latest PTSC, decrement the reference count. */ + Atomic_Dec32((Atomic_uint32 *)&vm->ptscOffsetInfo.inVMMCnt); + } +} + + +/* + *----------------------------------------------------------------------------- + * + * TaskUpdatePTSCParameters -- + * + * If the PTSC is behind where it should be, based on the host's + * uptime, then adjust the PTSC parameters. PR 118376. + * + * Results: + * None. + * + * Side effects: + * May update the PTSC parameters. + * + *----------------------------------------------------------------------------- + */ + +static INLINE_SINGLE_CALLER void +TaskUpdatePTSCParameters(VMDriver *vm, + VMCrossPageData *crosspage, + Vcpuid vcpuid) +{ + uint64 tsc, ptsc; + + ASSERT_NO_INTERRUPTS(); + ASSERT_ON_COMPILE(sizeof(vm->ptscOffsetInfo) == sizeof(Atomic_uint64)); + ptsc = Vmx86_GetPseudoTSC(); + /* + * Use unsigned comparison to test ptsc inside the interval: + * [worldSwitchPTSC, worldSwitchPTSC + largeDelta) + * where largeDelta is choosen to be much larger than the normal time + * between worldswitches, but not so large that we'd miss a jump due + * to TSC reset. + */ + if (UNLIKELY((uint64)(ptsc - crosspage->worldSwitchPTSC) > + Vmx86_GetPseudoTSCHz() * 4096)) { + /* + * If the PTSC went backwards since we last left the monitor, then either: + * a) TSC is unsynchronized across cores. + * b) TSC was reset (probably due to host stand by or hibernate). + * c) khzEstimate was incorrect (too low). + * d) the host's reference clock is too low resolution. + * e) the host's reference clock is broken. + * + * We handle case (a) and (b) by switch PTSC over to using the + * reference clock as the basis for pseudo TSC. + * + * For case (c), ideally we'd want to get khzEstimate correct in + * the first place. Using the reference clock for pseudo TSC is + * just a backup if all else failed. It will prevent PTSC from + * drifting from real time over the long run. Additionally, we + * could try to adopt the mult/shift of pseudoTSCConv to make PTSC + * run at the (incorrect) TSC kHz estimate, so that PTSC + * progresses at the correct rate over the short term (while in + * the monitor). + * + * We don't do anything for case (e). If we see it happen, we + * could try to pin the value returned by HostIF_ReadUptime to + * some sane range to help compensate. + */ + if (Vmx86_SetPseudoTSCUseRefClock()) { + ptsc = Vmx86_GetPseudoTSC(); + } + + /* + * For case (d), check for PTSC between (worldSwitchPTSC - Hz) and + * worldSwitchPTSC. 
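[Editorial note: TaskUpdatePTSCParameters below relies on a single unsigned subtraction to test whether PTSC stayed inside [worldSwitchPTSC, worldSwitchPTSC + largeDelta). A standalone sketch of that trick, assuming plain uint64_t arithmetic rather than the driver's types; InWindow and the 1 GHz figure are illustrative only. Because the subtraction wraps, one comparison rejects both "went backwards" and "jumped too far forward".]

#include <assert.h>
#include <stdbool.h>
#include <stdint.h>

/*
 * True iff value lies in [base, base + delta), even when the 64-bit
 * counter has wrapped between the two samples.
 */
static inline bool
InWindow(uint64_t value, uint64_t base, uint64_t delta)
{
   return value - base < delta;   /* unsigned: wraps to a huge number if value < base */
}

int
main(void)
{
   const uint64_t hz = 1000000000ULL;                    /* pretend 1 GHz PTSC */
   const uint64_t base = 42 * hz;
   assert(InWindow(base + 5, base, hz * 4096));          /* normal forward progress */
   assert(!InWindow(base - 5, base, hz * 4096));         /* went backwards: outside */
   assert(!InWindow(base + hz * 5000, base, hz * 4096)); /* jumped too far forward */
   return 0;
}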
That is, if ptsc is still behind + * worldSwitchPTSC (even after ensuring the PTSC is based on the + * reference clock), but by less than a second, assume that the + * reference clock is too low of resolution, and nudge PTSC + * forward to ensure it doesn't go backwards on this VCPU. If we + * are more than a second behind, then we assume that the + * reference clock was stepped (or broken) and we just stay in + * sync with it. + */ + if ((uint64)(crosspage->worldSwitchPTSC - ptsc) < + Vmx86_GetPseudoTSCHz()) { + ptsc = crosspage->worldSwitchPTSC; + } + } + + /* + * While running in the monitor, we can't read the reference + * clock, which is implemented by the host OS. So, offset from + * the current pseudoTSC value using the TSC in order to provide + * high resolution PTSC while in the monitor. The RDTSC below + * must be executed on the same pcpu that the vmm vcpu thread will + * run on (in case of out of sync TSCs). This is guaranteed since + * we are on the on-ramp into the monitor with interrupts + * disabled. + */ + tsc = RDTSC(); + if (Vmx86_HwTSCsSynced()) { + /* + * When the TSCs are synchronized, make Pseudo TSC synchronized + * as well. To ensure this, all vcpu threads of a VM that are + * simultaneously running their VMMs need to use the same exact + * offset. This global offset can be updated only when no + * threads are running in the VMM. In the case of synchronized + * TSCs, updating the offset only when all threads are outside + * the VMM is okay in terms of keeping VMMs' PTSC close to real + * time because the TSCs stop only when all cores enter a deep + * sleep state (otherwise the TSCs wouldn't be in sync to begin + * with). + */ + PseudoTSCOffsetInfo old, new; + do { + old = vm->ptscOffsetInfo; + new = old; + if (new.inVMMCnt == 0) { + int64 ptscOffset; + if (Vmx86_PseudoTSCUsesRefClock()) { + /* Must read ptscLatest after reading ptscOffsetInfo. */ + uint64 latest = Atomic_Read64(&vm->ptscLatest); + if (UNLIKELY(ptsc < latest)) { + /* + * The Vmx86_GetPseudoTSC call above occurred before + * some other vcpu thread exited the monitor; need to + * bump forward. + */ + ptsc = latest; + } + ptscOffset = ptsc - tsc; + } else { + ptscOffset = Vmx86_GetPseudoTSCOffset(); + } + /* + * Since inVMMCnt is zero, it is safe to update our entry in + * ptscOffsets -- no other thread will try to read it until + * the inVMMCnt > 0. + */ + vm->ptscOffsets[vcpuid] = ptscOffset; + /* Try to use this thread's offset as the global offset. */ + new.vcpuid = vcpuid; + } + new.inVMMCnt++; + } while (!Atomic_CMPXCHG64((Atomic_uint64 *)&vm->ptscOffsetInfo, + (uint64 *)&old, (uint64 *)&new)); + /* Use the designated global offset as this thread's offset. */ + crosspage->pseudoTSCConv.p.add = vm->ptscOffsets[new.vcpuid]; + crosspage->pseudoTSCConv.changed = TRUE; + /* + * Need to derive the worldSwitchPTSC value from TSC since the + * PTSC, when calculated from TSC, may drift from the reference + * clock over the short term. + */ + ptsc = tsc + crosspage->pseudoTSCConv.p.add; + } else { + crosspage->pseudoTSCConv.p.add = ptsc - tsc; + crosspage->pseudoTSCConv.changed = TRUE; + } + /* Cache PTSC value for BackToHost. */ + crosspage->worldSwitchPTSC = ptsc; +} + + +/* + *----------------------------------------------------------------------------- + * + * TaskSwitchToMonitor -- + * + * Wrapper that calls code to switch from the host to the monitor. 
+ * + * The basic idea is to do a (*(crosspage->hostToVmm))(crosspage) + * but it's complicated because we must have a common call format + * between GCC and MSC. + * + * Since we have complete control over what GCC does with asm volatile, + * this amounts to having GCC do exactly what MSC does. + * For 64-bit hosts, we pass the parameter in RCX. + * + * For 64-bit GCC, the callee is expected to preserve + * RBX,RBP,RSP,R12..R15, whereas MSC expects the callee to preserve + * RBX,RSI,RDI,RBP,RSP,R12..R15. So for simplicity, we have the + * worldswitch code save RBX,RSI,RDI,RBP,RSP,R12..R15. + * + * From an email with Petr regarding gcc's handling of the stdcall + * attribute for x86-64: + * + * As far as I can tell, for x86_64 there is only one calling + * convention: + * On GCC rdi/rsi/rdx/rcx/r8d/r9d for <= 6 arguments, + * others always on stack, caller always adjusts stack. + * + * On MSC it is rcx/rdx/r8d/r9d for <= 4 arguments, rest on + * stack. When more than 4 arguments are passed, spill space is + * reserved on the stack for the register arguments. Argument + * 5 is accessed at (5 * 8)(rsp). + * + * Side effects: + * The monitor does many things, but it's irrelevant to this code. The + * worldswitch should eventually return here with the host state intact. + * + *----------------------------------------------------------------------------- + */ + +static INLINE_SINGLE_CALLER void +TaskSwitchToMonitor(VMCrossPage *crosspage) +{ + const uint8 *codePtr = ((uint8 *)&crosspage->crosspageCode.worldswitch + + crosspage->crosspageCode.worldswitch.hostToVmm); + +#if defined(__GNUC__) + /* + * Pass the crosspage pointer in RCX just like 64-bit MSC does. + * Tell GCC that the worldswitch preserves RBX,RSI,RDI,RBP,RSP, + * R12..R15 just like the MSC 64-bit calling convention. + */ + + { + uint64 raxGetsWiped, rcxGetsWiped; + + __asm__ __volatile__("call *%%rax" + : "=a" (raxGetsWiped), + "=c" (rcxGetsWiped) + : "0" (codePtr), + "1" (crosspage) + : "rdx", "r8", "r9", "r10", "r11", "cc", "memory"); + } +#elif defined(_MSC_VER) + /* + * The 64-bit calling convention is to pass the argument in RCX and that + * the called function must preserve RBX,RSI,RDI,RBP,RSP,R12..R15. + */ +#pragma warning(suppress: 4055) // Cast of data pointer to function pointer. + (*(void (*)(VMCrossPage *))codePtr)(crosspage); +#else +#error No compiler defined for TaskSwitchToMonitor +#endif +} + + +static void +TaskTestCrossPageExceptionHandlers(VMCrossPage *crosspage) +{ + static Bool testSwitchNMI = TRUE; /* test only first time through */ + + /* + * Test the DB,NMI,MCE handlers to make sure they can set the + * flags. This is calling the handlers in switchNMI.S. + */ + + if (vmx86_debug && testSwitchNMI) { + Bool gotSave; + + testSwitchNMI = FALSE; + + /* + * RAISE_INTERRUPT calls Switch{32,64}DBHandler in switchNMI.S + * (depending on host bitsize). + */ + + gotSave = TaskGotException(crosspage, EXC_DB); + TaskSetException(crosspage, EXC_DB, FALSE); + RAISE_INTERRUPT(1); + TS_ASSERT(TaskGotException(crosspage, EXC_DB)); + TaskSetException(crosspage, EXC_DB, gotSave); + + /* + * RAISE_INTERRUPT calls Switch{32,64}NMIHandler in switchNMI.S + * (depending on host bitsize). + */ + gotSave = TaskGotException(crosspage, EXC_NMI); + TaskSetException(crosspage, EXC_NMI, FALSE); + RAISE_INTERRUPT(EXC_NMI); + TS_ASSERT(TaskGotException(crosspage, EXC_NMI)); + +#if defined(__GNUC__) + /* + * Test the LRETQ in the 64-bit mini NMI handler to make sure + * it works with any 16-byte offset of the stack pointer. 
+ * The INT 2 calls Switch64NMIHandler in switchNMI.S. + */ + { + uint64 v1, v2; + + asm volatile ("\n" + " movl $16, %%ecx \n" + "1000: \n" + " decq %%rsp \n" + " movb $0xDB, (%%rsp) \n" + " int $2 \n" + " loop 1000b \n" + " popq %%rcx \n" + " popq %%rax \n" + : "=a" (v1), "=c" (v2)); + + /* + * Ensure nothing overwritten just above where it is + * allowed to, because the decq rsp/movb 0xDBs pushed 16 + * of them one byte at a time. + */ + + TS_ASSERT(v1 == 0xDBDBDBDBDBDBDBDBULL); + TS_ASSERT(v2 == 0xDBDBDBDBDBDBDBDBULL); + } +#endif + TaskSetException(crosspage, EXC_NMI, gotSave); + + /* + * RAISE_INTERRUPT calls Switch{32,64}MCEHandler in switchNMI.S + * (depending on host bitsize). + */ + + gotSave = TaskGotException(crosspage, EXC_MC); + TaskSetException(crosspage, EXC_MC, FALSE); + RAISE_INTERRUPT(EXC_MC); + TS_ASSERT(TaskGotException(crosspage, EXC_MC)); + TaskSetException(crosspage, EXC_MC, gotSave); + } +} + + +/* + *----------------------------------------------------------------------------- + * + * TaskShouldRetryWorldSwitch -- + * + * Returns whether or not we should retry the world switch. + * + * It is possible that the gotNMI and/or gotMCE was detected when + * switching in the host->monitor direction, in which case the + * retryWorldSwitch flag will be set. If such is the case, we + * want to immediately loop back to the monitor as that is what + * it is expecting us to do. + * + *----------------------------------------------------------------------------- + */ + +static INLINE Bool +TaskShouldRetryWorldSwitch(VMCrossPage *crosspage) +{ + Bool result = crosspage->crosspageData.retryWorldSwitch; + crosspage->crosspageData.retryWorldSwitch = FALSE; + return result; +} + + +/* + *----------------------------------------------------------------------------- + * + * Task_Switch -- + * + * Switches from the host context into the monitor context and + * then receives control when the monitor returns to the + * host. + * + * Think of it as a coroutine switch that changes not only the + * registers, but also the address space and all the hardware + * state. + * + * Results: + * None. + * + * Side effects: + * Jump to the monitor. Has no direct effect on the host-visible + * state except that it might generate an interrupt. + * + *----------------------------------------------------------------------------- + */ + +void +Task_Switch(VMDriver *vm, // IN + Vcpuid vcpuid) // IN +{ + uintptr_t flags; + uint64 fs64 = 0; + uint64 gs64 = 0; + uint64 kgs64 = 0; + uint64 pebsMSR = 0; + DTR64 hostGDT64, hostIDT64; + Selector cs, ds, es, fs, gs, ss; + Selector hostTR; + Selector hostLDT; + Bool lint0NMI; + Bool lint1NMI; + Bool pcNMI; + Bool thermalNMI; + VMCrossPage *crosspage = vm->crosspage[vcpuid]; + uint32 pCPU; + MPN hvRootMPN; + Descriptor *tempGDTBase; + + ASSERT_ON_COMPILE(sizeof(VMCrossPage) == PAGE_SIZE); + TaskDisableNMI(&vm->hostAPIC, &lint0NMI, &lint1NMI, &pcNMI, &thermalNMI); + SAVE_FLAGS(flags); + CLEAR_INTERRUPTS(); + + pCPU = HostIF_GetCurrentPCPU(); + ASSERT(pCPU < ARRAYSIZE(hvRootPage) && pCPU < ARRAYSIZE(tmpGDT)); + + hvRootMPN = Atomic_Read64(&hvRootPage[pCPU]); + tempGDTBase = USE_TEMPORARY_GDT ? Atomic_ReadPtr(&tmpGDT[pCPU]) : NULL; + + /* + * We can't allocate memory with interrupts disabled on all hosts + * so we dummy up a modulecall to do it before we start in on the + * world switch. We must be careful not to overwrite the + * crosspages arguments when doing this though, see bug 820257. 
+ */ + if (hvRootMPN == INVALID_MPN && + (crosspage->crosspageData.activateVMX || + crosspage->crosspageData.activateSVM)) { + crosspage->crosspageData.userCallType = MODULECALL_USERCALL_NONE; + crosspage->crosspageData.moduleCallType = MODULECALL_ALLOC_VMX_PAGE; + crosspage->crosspageData.pcpuNum = pCPU; + } else if (USE_TEMPORARY_GDT && tempGDTBase == NULL) { + crosspage->crosspageData.userCallType = MODULECALL_USERCALL_NONE; + crosspage->crosspageData.moduleCallType = MODULECALL_ALLOC_TMP_GDT; + crosspage->crosspageData.pcpuNum = pCPU; + } else { + do { + uintptr_t cr0reg, cr2reg, cr3reg, cr4reg; + uint64 efer = ~0ULL; + Bool needVMXOFF = FALSE; + MA foreignVMCS = ~0ULL; + MA foreignHSAVE = ~0ULL; + + vm->currentHostCpu[vcpuid] = pCPU; + + TaskUpdatePTSCParameters(vm, &crosspage->crosspageData, vcpuid); + + /* + * Disable PEBS if it is supported and enabled. Do this while on the + * hosts IDT - PR 848701. + */ + if (pebsAvailable) { + pebsMSR = __GET_MSR(IA32_MSR_PEBS_ENABLE); + if (pebsMSR != 0) { + __SET_MSR(IA32_MSR_PEBS_ENABLE, 0); + } + } + + /* + * Save the host's standard IDT and set up an IDT that only + * has space for all the hardware exceptions (though only a + * few are handled). + */ + + TaskSaveIDT64(&hostIDT64); + TaskLoadIDT64(&crosspage->crosspageData.switchHostIDTR); + TaskTestCrossPageExceptionHandlers(crosspage); + + if (crosspage->crosspageData.activateVMX) { + /* + * Ensure that VMX is enabled and locked in the feature control MSR, + * so that we can set CR4.VMXE to activate VMX. + */ + uint64 bits = MSR_FEATCTL_LOCK | MSR_FEATCTL_VMXE; + uint64 featCtl = __GET_MSR(MSR_FEATCTL); + if ((featCtl & bits) != bits) { + if ((featCtl & MSR_FEATCTL_LOCK) != 0) { + Panic("Intel VT-x is disabled and locked on CPU %d\n", pCPU); + } + __SET_MSR(MSR_FEATCTL, featCtl | bits); + } + } + + /* + * Save CR state. The monitor deals with EFER. + */ + + GET_CR2(cr2reg); + GET_CR0(cr0reg); + GET_CR4(cr4reg); + GET_CR3(cr3reg); + crosspage->crosspageData.hostCR3 = cr3reg; + + /* + * Any reserved bits in CR0 must be preserved when we switch + * to the VMM. [See PR 291004.] (On the other hand, Intel + * recommends that we clear any reserved CR4 bits.) + */ + crosspage->crosspageData.wsCR0 &= ~CR0_RESERVED; + crosspage->crosspageData.wsCR0 |= (cr0reg & CR0_RESERVED); + + /* + * CR4.VMXE must be enabled to support VMX in the monitor, and it + * can't be cleared if it is set on the host. + */ + if (crosspage->crosspageData.activateVMX || (cr4reg & CR4_VMXE) != 0) { + crosspage->crosspageData.wsCR4 |= CR4_VMXE; + } + + /* + * The world-switch CR4.MCE and CR4.PCIDE should always reflect the + * host's values. CR4.PCIDE will be cleared once we're in the monitor, + * running on a CR3 with a PCID field of 0. + */ + crosspage->crosspageData.wsCR4 = + (crosspage->crosspageData.wsCR4 & ~(CR4_MCE | CR4_PCIDE)) | + (cr4reg & (CR4_MCE | CR4_PCIDE)); + + /* + * The world-switch should never have global pages enabled. Therefore, + * switching to the monitor's CR4 ensures that global pages are + * flushed. + */ + ASSERT((crosspage->crosspageData.wsCR4 & CR4_PGE) == 0); + + /* + * Load the world-switch CR0 and CR4. We can't load the monitor's + * CR3 yet, because the current code isn't mapped into the + * monitor's address space. 
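[Editorial note: the wsCR0/wsCR4 handling below keeps selected host bits (reserved CR0 bits, CR4.MCE, CR4.PCIDE) while using the world-switch values for everything else. A tiny standalone restatement of that merge-under-mask idiom; MergeUnderMask and the constants are illustrative, not CR register values.]

#include <assert.h>
#include <stdint.h>

/* Take 'ours' but keep exactly the bits selected by 'mask' from 'host'. */
static inline uint64_t
MergeUnderMask(uint64_t ours, uint64_t host, uint64_t mask)
{
   return (ours & ~mask) | (host & mask);
}

int
main(void)
{
   /* Hypothetical values: preserve bits 63:32 of the host word. */
   uint64_t merged = MergeUnderMask(0x00000000DEADBEEFULL,
                                    0x1234567800000000ULL,
                                    0xFFFFFFFF00000000ULL);
   assert(merged == 0x12345678DEADBEEFULL);
   return 0;
}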
+ */ + SET_CR0((uintptr_t)crosspage->crosspageData.wsCR0); + SET_CR4((uintptr_t)crosspage->crosspageData.wsCR4); + + TaskSaveDebugRegisters(crosspage); + + TaskSaveGDT64(&hostGDT64); + + if (crosspage->crosspageData.activateVMX) { + MA vmxonRegion = MPN_2_MA(hvRootMPN); + VMXStatus status = VMXON_2_STATUS(&vmxonRegion); + if (status == VMX_Success) { + needVMXOFF = TRUE; + } else { + VMPTRST(&foreignVMCS); + } + } + + if (crosspage->crosspageData.activateSVM) { + efer = __GET_MSR(MSR_EFER); + if ((efer & MSR_EFER_SVME) == 0) { + __SET_MSR(MSR_EFER, efer | MSR_EFER_SVME); + } + foreignHSAVE = __GET_MSR(MSR_VM_HSAVE_PA); + __SET_MSR(MSR_VM_HSAVE_PA, MPN_2_MA(hvRootMPN)); + } + + /* + * If NMI stress testing enabled, set EFLAGS. This will + * make sure there is a valid IDT, GDT, stack, etc. at every + * instruction boundary during the switch. + */ + if (WS_INTR_STRESS) { + TaskEnableTF(); + } + + /* + * GS and FS are saved outside of the TaskSwitchToMonitor() code to + * + * 1) minimize the amount of code handled there, and + * + * 2) prevent us from faulting if they happen to be in the LDT + * (since the LDT is saved and restored here too). + * + * Also, the 32-bit Mac OS running in legacy mode has + * CS, DS, ES, SS in the LDT! + */ + cs = GET_CS(); + ss = GET_SS(); +#if defined __APPLE__ + /* + * The 64-bit Mac OS kernel leaks segment selectors from + * other threads into 64-bit threads. When the selectors + * reference a foreign thread's LDT, we may not be able to + * reload them using our thread's LDT. So, let's just clear + * them instead of trying to preserve them. [PR 467140] + */ + ds = 0; + es = 0; + fs = 0; + gs = 0; +#else + ds = GET_DS(); + es = GET_ES(); + fs = GET_FS(); + gs = GET_GS(); +#endif + GET_LDT(hostLDT); + GET_TR(hostTR); + + kgs64 = GET_KernelGS64(); + gs64 = GET_GS64(); + fs64 = GET_FS64(); + + /* + * Make sure stack segment is non-zero so worldswitch can use it + * to temporarily restore DS,ES on return. + */ + if (ss == 0) { + SET_SS(kernelStackSegment); + } + + TS_ASSERT(SELECTOR_TABLE(cs) == SELECTOR_GDT); + TS_ASSERT(SELECTOR_TABLE(ds) == SELECTOR_GDT); + TS_ASSERT(SELECTOR_TABLE(ss) == SELECTOR_GDT); + + DEBUG_ONLY(crosspage->crosspageData.tinyStack[0] = 0xDEADBEEF;) + /* Running in host context prior to TaskSwitchToMonitor() */ + TaskSwitchToMonitor(crosspage); + /* Running in host context after to TaskSwitchToMonitor() */ + + TS_ASSERT(crosspage->crosspageData.tinyStack[0] == 0xDEADBEEF); + + /* + * Temporarily disable single-step stress as VMX/VMCS change code + * ASSERTS on RFLAGS content without allowing TF/RF to be set. + */ + if (WS_INTR_STRESS) { + TaskDisableTF(); + } + + if (needVMXOFF) { + VMXOFF(); + } else if (foreignVMCS != ~0ULL) { + VMPTRLD_UNCHECKED(&foreignVMCS); + } + + if (WS_INTR_STRESS) { + TaskEnableTF(); + } + + if (crosspage->crosspageData.activateSVM) { + __SET_MSR(MSR_VM_HSAVE_PA, foreignHSAVE); + if ((efer & MSR_EFER_SVME) == 0) { + __SET_MSR(MSR_EFER, efer); + } + } + + /* + * Restore CR state. + * CR3 should already have been restored. CR0 and CR4 have to + * be restored if the world switch values do not match the host's. + * CR2 always has to be restored. CR8 never has to be restored. + */ + SET_CR2(cr2reg); + if (crosspage->crosspageData.wsCR0 != cr0reg) { + SET_CR0(cr0reg); + } + if (crosspage->crosspageData.wsCR4 != cr4reg) { + SET_CR4(cr4reg); + } else if ((cr4reg & CR4_PCIDE) != 0) { + /* + * Flush PCID 0. 
+ */ + ASSERT((cr4reg & CR4_PGE) == 0); + SET_CR4(cr4reg | CR4_PGE); + SET_CR4(cr4reg); + } + if (vmx86_debug) { + uintptr_t cr; + GET_CR0(cr); + ASSERT(cr == cr0reg); + GET_CR4(cr); + ASSERT(cr == cr4reg); + GET_CR3(cr); + ASSERT(cr == cr3reg); + } + + /* + * TaskSwitchToMonitor() returns with GDT = crossGDT so switch back to + * the host GDT here. We will also restore host TR as the task busy + * bit needs to be fiddled with. Also restore host LDT while we're + * at it. + */ + TaskRestoreHostGDTTRLDT(tempGDTBase, hostGDT64, + hostLDT, cs, hostTR); + + SET_DS(ds); + SET_ES(es); + + /* + * First, restore %fs and %gs from the in-memory descriptor tables, + * and then overwrite the bases in the descriptor cache with the + * saved 64-bit values. + */ + + SET_FS(fs); + SET_GS(gs); + SET_FS64(fs64); + SET_GS64(gs64); + SET_KernelGS64(kgs64); + + /* Restore debug registers and host's IDT; turn off stress test. */ + if (WS_INTR_STRESS) { + TaskDisableTF(); + } + + TaskRestoreDebugRegisters(&crosspage->crosspageData); + + ASSERT_NO_INTERRUPTS(); + + /* + * Restore standard host interrupt table and re-enable PEBS afterwards + * iff we disabled it. + */ + + TaskLoadIDT64(&hostIDT64); + + if (pebsMSR != 0) { + __SET_MSR(IA32_MSR_PEBS_ENABLE, pebsMSR); + } + + TaskUpdateLatestPTSC(vm, &crosspage->crosspageData); + vm->currentHostCpu[vcpuid] = INVALID_PCPU; + + /* + * If an #NMI or #MCE was logged while switching, re-raise such an + * interrupt or exception for the host to consume. Handlers preserve + * NMI-blocking (when not stress-testing or changing VIP/VIP) by using + * synthetic irets instead of real irets. By this point, if an NMI + * was received during switching, NMIs should still be blocked. + * + * When stress testing, NMIs are almost guaranteed to be synthetic, so + * no NMI is raised. + * + * If a #UD was logged while switching, warn accordingly rather than + * raising a new exception as this would likely panic the host kernel. + */ + + if (UNLIKELY(TaskGotException(crosspage, EXC_NMI))) { + TaskSetException(crosspage, EXC_NMI, FALSE); + if (!WS_INTR_STRESS) { + RAISE_INTERRUPT(EXC_NMI); + } + } + + if (UNLIKELY(TaskGotException(crosspage, EXC_MC))) { + TaskSetException(crosspage, EXC_MC, FALSE); + if (vmx86_debug) { + CP_PutStr("Task_Switch: forwarding MCE to host\n"); + } + RAISE_INTERRUPT(EXC_MC); + } + if (UNLIKELY(TaskGotException(crosspage, EXC_UD))) { + Warning("#UD occurred on switch back to host; dumping core"); + } + /* + * The NMI/MCE checks above are special cases for interrupts + * received during worldswitch. Here is the more generic case + * of forwarding NMIs received while executing the VMM/guest. + */ + if (crosspage->crosspageData.moduleCallType == MODULECALL_INTR && + crosspage->crosspageData.args[0] == EXC_NMI) { + /* + * If VMM was interrupted by an NMI, do the INT 2 so the + * host will handle it, but then return immediately to the + * VMM in case the VMM was in the middle of a critical + * region. E.g. the NMI may have interrupted the VMM while + * an interrupt was in service, before the VMM or host has + * done the EOI. + */ + RAISE_INTERRUPT(EXC_NMI); + crosspage->crosspageData.retryWorldSwitch = TRUE; + } + } while (UNLIKELY(TaskShouldRetryWorldSwitch(crosspage))); + } + + if (crosspage->crosspageData.moduleCallType == MODULECALL_INTR) { + /* + * Note we must do the RAISE_INTERRUPT before ever enabling + * interrupts or bad things have happened (might want to know exactly + * what bad things btw). 
+ */ +#ifdef _WIN64 + if (crosspage->crosspageData.args[0] <= 0xFF && + (crosspage->crosspageData.args[0] >= 0x14 || + crosspage->crosspageData.args[0] == EXC_MC)) { + RAISE_INTERRUPT((unsigned char)crosspage->crosspageData.args[0]); + } else { + Warning("%s: Received Unexpected Interrupt: 0x%"FMT64"X\n", + __FUNCTION__, crosspage->crosspageData.args[0]); + Panic("Received Unexpected Interrupt: 0x%"FMT64"X\n", + crosspage->crosspageData.args[0]); + } +#else + /* + * Note2 RAISE_INTERRUPT() only takes a constant and hence with switch + * statement. + */ +#define IRQ_INT(_x) case _x: RAISE_INTERRUPT(_x); break +#define IRQ_INT2(_x) IRQ_INT(_x); IRQ_INT(_x + 1) +#define IRQ_INT4(_x) IRQ_INT2(_x); IRQ_INT2(_x + 2) +#define IRQ_INT8(_x) IRQ_INT4(_x); IRQ_INT4(_x + 4) +#define IRQ_INT16(_x) IRQ_INT8(_x); IRQ_INT8(_x + 8) +#define IRQ_INT32(_x) IRQ_INT16(_x); IRQ_INT16(_x + 16) + + switch (crosspage->crosspageData.args[0]) { + // These are the general IO interrupts + // It would be nice to generate this dynamically, but see Note2 above. + + /* + * Pass Machine Check Exception (Interrupt 0x12) to the host. + * See bug #45286 for details. + */ + IRQ_INT(EXC_MC); + + /* + * pass the reserved vectors (20-31) as well. amd64 windows + * generates these. + */ + + IRQ_INT8(0x14); + IRQ_INT4(0x1c); + + IRQ_INT32(0x20); + IRQ_INT32(0x40); + IRQ_INT32(0x60); + IRQ_INT32(0x80); + IRQ_INT32(0xa0); + IRQ_INT32(0xc0); + IRQ_INT32(0xe0); + + default: + /* + * XXXX nt running on a 2 processor machine we hit this Panic + * with int 0xD1 0x61 ... + */ + + Warning("%s: Received Unexpected Interrupt: 0x%"FMT64"X\n", + __FUNCTION__, crosspage->crosspageData.args[0]); + Panic("Received Unexpected Interrupt: 0x%"FMT64"X\n", + crosspage->crosspageData.args[0]); + } +#endif + } + + RESTORE_FLAGS(flags); + TaskRestoreNMI(&vm->hostAPIC, lint0NMI, lint1NMI, pcNMI, thermalNMI); +} diff --git a/vmmon-only/common/task.h b/vmmon-only/common/task.h new file mode 100644 index 00000000..b2fcfd97 --- /dev/null +++ b/vmmon-only/common/task.h @@ -0,0 +1,43 @@ +/********************************************************* + * Copyright (C) 1998-2013 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. 
+ * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + + + +#ifndef TASK_H +#define TASK_H + +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMCORE +#include "includeCheck.h" + +struct InitBlock; +struct InitCrossGDT; + +extern Bool Task_AllocCrossGDT(struct InitBlock *initBlock); +extern int Task_InitCrosspage(VMDriver *vm, struct InitBlock *params); +extern int Task_InitCrossGDT(struct InitCrossGDT *initCrossGDT); +extern void Task_Switch(VMDriver *vm, Vcpuid vcpuid); +extern Bool Task_Initialize(void); +extern void Task_Terminate(void); +extern MPN Task_GetHVRootPageForPCPU(uint32 pCPU); +extern Descriptor *Task_GetTmpGDT(uint32 pCPU); + +#endif + + + diff --git a/vmmon-only/common/vmx86.c b/vmmon-only/common/vmx86.c new file mode 100644 index 00000000..dbe794c5 --- /dev/null +++ b/vmmon-only/common/vmx86.c @@ -0,0 +1,2920 @@ +/********************************************************* + * Copyright (C) 1998-2016 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * vmx86.c -- + * + * Platform independent routines for creating/destroying/running + * virtual machine monitors. + */ + +#ifdef linux +/* Must come before any kernel header file --hpreg */ +# include "driver-config.h" + +# include /* memset() in the kernel */ +# include /* jiffies from the kernel */ +#else +# include +#endif + +#ifdef __APPLE__ +#include // must come before "vmware.h" +#endif + +#include "vmware.h" +#include "vm_assert.h" +#include "vm_basic_math.h" +#include "vmx86.h" +#include "task.h" +#include "initblock.h" +#include "vm_asm.h" +#include "iocontrols.h" +#include "hostif.h" +#include "cpuid.h" +#include "vcpuset.h" +#include "memtrack.h" +#include "hashFunc.h" +#if defined(_WIN64) +#include "x86.h" +#include "vmmon-asm-x86-64.h" +#endif +#include "x86vt.h" +#include "x86svm.h" +#include "x86cpuid_asm.h" +#if defined(linux) +#include +#endif +#include "x86perfctr.h" + + +PseudoTSC pseudoTSC; + +/* + * Keep track of the virtual machines that have been + * created using the following structures. + */ + +static VMDriver *vmDriverList = NULL; + +static LockedPageLimit lockedPageLimit = { + 0, // host: does not need to be initialized. + 0, // configured: must be set by some VM as it is powered on. + (uint32)MAX_LOCKED_PAGES, // dynamic +}; + +/* Percentage of guest "paged" memory that must fit within the hard limit. */ +static unsigned minVmMemPct; + +/* Number of pages actually locked by all virtual machines */ +static unsigned numLockedPages; + +/* Total virtual machines on this host */ +static unsigned vmCount; + +/* Total number of open vmmon file handles. 
*/ +static unsigned fdCount; + +/* + * We implement a list of allocated VM ID's using an array. + * The array is initialized with the values 1...MAX_VMS-1, INVALID_VMID. + * vmIDsAllocated holds the last VM ID given out and vmIDsUnused + * holds the next VM ID to give out. + */ + +#define INVALID_VMID (-1) +static int vmIDList[MAX_VMS]; +static int vmIDsAllocated; +static int vmIDsUnused; + +/* Max rate requested for fast clock by any virtual machine. */ +static unsigned globalFastClockRate; + +/* + *---------------------------------------------------------------------- + * + * Vmx86AdjustLimitForOverheads -- + * + * This function adjusts an overall limit on the number of + * locked pages to take into account overhead for the vmx processes, etc. + * since the hostOS will also see this as overhead. We do this for all + * vmx processes, not just ones whose vms have been admitted. + * + * If "vm" is NULL, we are allocating a global page and have no + * perVMOverhead term to take into account. + * + * Results: + * Number of remaining pages considered to be lockable on this host. + * + * Side effects: + * None. + * + *---------------------------------------------------------------------- + */ + +static INLINE unsigned +Vmx86AdjustLimitForOverheads(const VMDriver* vm, + const uint32 limit) +{ + uint32 extraCost = (vm != NULL) ? vmCount * vm->memInfo.perVMOverhead : 0; + ASSERT(HostIF_GlobalLockIsHeld()); + + return (extraCost < limit) ? (limit - extraCost) : 0; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86LockedPageLimit -- + * + * There are three limits controlling how many pages we can lock on + * a host: + * + * lockedPageLimit.configured is controlled by UI, + * lockedPageLimit.dynamic is controlled by authd's hardLimitMonitor, + * lockedPageLimit.host is calculated dynamically based on kernel stats + * by vmmon using kernel stats. + * + * We can lock the MIN of these values. + * + * Results: + * Number of pages to lock on this host. + * + * Side effects: + * Updates the host locked pages limit. + * + *---------------------------------------------------------------------- + */ + +static INLINE unsigned +Vmx86LockedPageLimit(const VMDriver* vm) // IN: +{ + uint32 overallLimit; + ASSERT(HostIF_GlobalLockIsHeld()); + + lockedPageLimit.host = HostIF_EstimateLockedPageLimit(vm, numLockedPages); + overallLimit = MIN(MIN(lockedPageLimit.configured, lockedPageLimit.dynamic), + lockedPageLimit.host); + + return Vmx86AdjustLimitForOverheads(vm, overallLimit); +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86HasFreePages -- + * + * Returns TRUE if the vm can lock more pages. This is true if + * we are below the host's hard memory limit and this vm has not + * exceeded its maximum allocation. + * Callers must ensure driver-wide and VM serialization + * typically by using HostIF_GlobalLock() and HostIF_VMLock(). + * + * Results: + * TRUE if pages can be locked, FALSE otherwise + * + * Side effects: + * None + * + *---------------------------------------------------------------------- + */ + +static INLINE Bool +Vmx86HasFreePages(VMDriver *vm, + unsigned int numPages, + Bool checkVM) +{ + /* + * 1) Be careful with overflow. + * 2) lockedPageLimit and vm->memInfo.maxAllocation can be decreased below + * the current numLockedPages and vm->memInfo.locked + * 3) lockedPageLimit.host can go lower than numLockedPages. 
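+ *
+ *    Worked example (illustrative numbers): with a global limit of 1000
+ *    pages and numLockedPages == 990, a request for numPages == 20 is
+ *    refused because limit - numLockedPages == 10 < 20; the same request
+ *    succeeds once at least 10 pages have been unlocked elsewhere.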
+ */ + + ASSERT(HostIF_GlobalLockIsHeld() && + (!checkVM || HostIF_VMLockIsHeld(vm))); + + if (checkVM) { + /* + * Check the per-vm limit. + */ + + ASSERT(HostIF_VMLockIsHeld(vm)); + if (vm->memInfo.admitted) { + if (vm->memInfo.maxAllocation <= vm->memInfo.locked) { + return FALSE; + } else if (vm->memInfo.maxAllocation - vm->memInfo.locked < numPages) { + return FALSE; + } + } + } else { + /* + * Check the global limit. + */ + + unsigned limit = Vmx86LockedPageLimit(vm); + + if (limit <= numLockedPages) { + return FALSE; + } else if (limit - numLockedPages < numPages) { + return FALSE; + } + } + + return TRUE; +} + + +#ifdef VMX86_DEBUG +/* + *---------------------------------------------------------------------- + * + * Vmx86VMIsRegistered -- + * + * Check if "vm" is on the list of VMDrivers. + * + * Results: + * Return TRUE iff "vm" is on the list of VMDrivers. + * + * Side effects: + * None + * + *---------------------------------------------------------------- + */ + +static Bool +Vmx86VMIsRegistered(VMDriver *vm, Bool needsLock) +{ + VMDriver *tmp; + Bool found = FALSE; + + ASSERT(needsLock || HostIF_GlobalLockIsHeld()); + + if (needsLock) { + HostIF_GlobalLock(5); + } + + for (tmp = vmDriverList; tmp != NULL; tmp = tmp->nextDriver) { + if (tmp == vm) { + found = TRUE; + break; + } + } + + if (needsLock) { + HostIF_GlobalUnlock(5); + } + + return found; +} +#endif + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_InitIDList -- + * + * Called when the driver is initialized. + * Set up the list of available VM ID's. + * + * Results: + * None. Sets up global data. + * + * Side effects: + * None. + * + *---------------------------------------------------------------------- + */ + +void +Vmx86_InitIDList(void) +{ + int i; + + HostIF_GlobalLock(32); + + for (i = 0; i < MAX_VMS; i++) { + vmIDList[i] = i + 1; + } + vmIDList[MAX_VMS - 1] = INVALID_VMID; + vmIDsUnused = 0; + vmIDsAllocated = INVALID_VMID; + + HostIF_GlobalUnlock(32); +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86FreeVMID -- + * + * Return a VM ID to the list of available VM ID's. + * + * Results: + * None + * + * Side effects: + * None + * + *---------------------------------------------------------------------- + */ + +static void +Vmx86FreeVMID(int vmID) // IN +{ + int i; + + ASSERT(HostIF_GlobalLockIsHeld()); + + /* Deleting head of the list. */ + if (vmID == vmIDsAllocated) { + int tmp; + + tmp = vmIDList[vmIDsAllocated]; + vmIDList[vmIDsAllocated] = vmIDsUnused; + vmIDsAllocated = tmp; + vmIDsUnused = vmID; + + return; + } + + for (i = vmIDsAllocated; vmIDList[i] != INVALID_VMID; i = vmIDList[i]) { + if (vmIDList[i] == vmID) { + vmIDList[i] = vmIDList[vmID]; + vmIDList[vmID] = vmIDsUnused; + vmIDsUnused = vmID; + + return; + } + } +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86AllocVMID -- + * + * Grab a VM ID from the list of available VM ID's. + * + * Results: + * The VM ID, in the range [ 0 ; MAX_VMS ). 
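+ *
+ *      For example (illustrative trace): immediately after
+ *      Vmx86_InitIDList() the first three calls return 0, 1 and 2; if
+ *      ID 1 is then released via Vmx86FreeVMID(), it moves to the head
+ *      of the unused list and is the next ID handed out.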
+ * + * Side effects: + * None + * + *---------------------------------------------------------------------- + */ + +static int +Vmx86AllocVMID(void) +{ + int vmID; + + ASSERT(HostIF_GlobalLockIsHeld()); + + vmID = vmIDsUnused; + ASSERT(0 <= vmID && vmID < MAX_VMS); + vmIDsUnused = vmIDList[vmID]; + vmIDList[vmID] = vmIDsAllocated; + vmIDsAllocated = vmID; + + return vmID; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86RegisterVMOnList -- + * + * Add a VM to the list of registered VMs and increment + * the count of VMs. + * + * Results: + * None + * + * Side effects: + * Add VM to linked list. + * Increment count of VMs. + * + *---------------------------------------------------------------- + */ + +static void +Vmx86RegisterVMOnList(VMDriver *vm) // IN +{ + int vmID; + VMDriver **vmp; + + ASSERT(HostIF_GlobalLockIsHeld()); + vmCount++; + vmID = Vmx86AllocVMID(); + ASSERT(vm->userID == 0); + vm->userID = vmID + 1; + ASSERT(vm->userID > 0); + + for (vmp = &vmDriverList; *vmp != NULL; vmp = &(*vmp)->nextDriver) { + if (*vmp == vm) { + Warning("VM already registered on the list of VMs.\n"); + return; + } + } + *vmp = vm; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86DeleteVMFromList -- + * + * Delete a VM from the list of registered VMs and decrement + * the count of VMs. This function should be called on any + * VM registered on the VMDriverList before invoking + * Vmx86FreeAllVMResources to free its memory. + * + * Results: + * None + * + * Side effects: + * Remove VM from linked list. + * Decrement count of VMs. + * + *---------------------------------------------------------------- + */ + +static void +Vmx86DeleteVMFromList(VMDriver *vm) +{ + VMDriver **vmp; + + ASSERT(vm); + ASSERT(HostIF_GlobalLockIsHeld()); + for (vmp = &vmDriverList; *vmp != vm; vmp = &(*vmp)->nextDriver) { + if (*vmp == NULL) { + Warning("VM is not on the list of registered VMs.\n"); + return; + } + } + *vmp = vm->nextDriver; + vmCount--; + + Vmx86FreeVMID(vm->userID - 1); + numLockedPages -= vm->memInfo.locked; + + /* + * If no VM is running, reset the configured locked-page limit so + * that the next VM to power on sets it appropriately. + */ + + if (vmCount == 0) { + lockedPageLimit.configured = 0; + } +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86FreeAllVMResources + * + * Free the resources allocated for a vm that is not registered + * on the VMDriverList. Except in the case of Vmx86_CreateVM(), + * this should be called only after a call to Vmx86DeleteVMFromList(). + * + * Results: + * None + * + * Side effects: + * Memory freed. + * + *---------------------------------------------------------------------- + */ + +static void +Vmx86FreeAllVMResources(VMDriver *vm) +{ + ASSERT(!HostIF_GlobalLockIsHeld()); + if (vm) { + ASSERT(!Vmx86VMIsRegistered(vm, TRUE)); + + Vmx86_SetHostClockRate(vm, 0); + + HostIF_FreeAllResources(vm); + + HostIF_FreeKernelMem(vm); + } +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86ReserveFreePages -- + * + * Returns TRUE and increases locked page counts if the vm can lock + * more pages. This is true if we are below the host's hard memory + * limit and this vm has not exceeded its maximum allocation. + * The function is thread-safe. + * + * If ignoreLimits is TRUE then additional pages may be reserved even + * if limits are violated. 
The request to ignore limits may come in + * cases of anonymous page allocations. Swapping is not always possible + * at those points but a swap target will have been posted so that the + * vmm will release memory shortly allowing the excessive reservation + * to be reduced. + * + * Results: + * TRUE if pages are reserved for locking, FALSE otherwise + * + * Side effects: + * The global lock and VM's lock are acquired and released. + * + *---------------------------------------------------------------------- + */ + +static Bool +Vmx86ReserveFreePages(VMDriver *vm, + unsigned int numPages, + Bool ignoreLimits) +{ + Bool retval = FALSE; + int retries = 3; + + ASSERT(vm); + + for (retries = 3; !retval && (retries > 0); retries--) { + HostIF_GlobalLock(17); + HostIF_VMLock(vm, 0); + + // Check VM's limit and don't wait. + retval = Vmx86HasFreePages(vm, numPages, TRUE); + if (!retval) { + HostIF_VMUnlock(vm, 0); + HostIF_GlobalUnlock(17); + break; + } else { + // Wait to satisfy the global limit. + retval = Vmx86HasFreePages(vm, numPages, FALSE); + if (retval) { + numLockedPages += numPages; + vm->memInfo.locked += numPages; + HostIF_VMUnlock(vm, 0); + HostIF_GlobalUnlock(17); + break; + } else { + /* + * There are not enough pages -- drop the locks and wait for + * the host and/or other VMs to produce free pages. + */ + + HostIF_VMUnlock(vm, 0); + HostIF_GlobalUnlock(17); + HostIF_WaitForFreePages(10); + } + } + } + + if (!retval && ignoreLimits) { + HostIF_GlobalLock(17); + HostIF_VMLock(vm, 0); + numLockedPages += numPages; + vm->memInfo.locked += numPages; + HostIF_VMUnlock(vm, 0); + HostIF_GlobalUnlock(17); + retval = TRUE; + } + + return retval; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86UnreserveFreePages -- + * + * Decreases the global and VM's locked page counts. + * The function is thread-safe. + * + * Results: + * void + * + * Side effects: + * The global lock and VM's lock are acquired and released. + * + *---------------------------------------------------------------------- + */ + +static void +Vmx86UnreserveFreePages(VMDriver *vm, + unsigned int numPages) +{ + ASSERT(vm); + + HostIF_GlobalLock(18); + HostIF_VMLock(vm, 1); + + ASSERT(numLockedPages >= numPages); + ASSERT(vm->memInfo.locked >= numPages); + + numLockedPages -= numPages; + vm->memInfo.locked -= numPages; + + HostIF_VMUnlock(vm, 1); + HostIF_GlobalUnlock(18); +} + + +/* + *----------------------------------------------------------------------------- + * + * Vmx86_CreateVM -- + * + * Allocate and initialize a driver structure for a virtual machine. + * + * Results: + * VMDriver structure or NULL on error. + * + * Side effects: + * May allocate kernel memory. 
+ * + *----------------------------------------------------------------------------- + */ + +VMDriver * +Vmx86_CreateVM(void) +{ + VMDriver *vm; + Vcpuid v; + + vm = HostIF_AllocKernelMem(sizeof *vm, TRUE); + if (vm == NULL) { + return NULL; + } + memset(vm, 0, sizeof *vm); + + vm->userID = 0; + vm->memInfo.admitted = FALSE; + vm->fastSuspResFlag = 0; + for (v = 0; v < MAX_INITBLOCK_CPUS; v++) { + vm->currentHostCpu[v] = INVALID_PCPU; + } + + if (HostIF_Init(vm)) { + goto cleanup; + } + + HostIF_GlobalLock(0); + +#ifdef _WIN32 + if (vmCount >= MAX_VMS_WIN32) { + HostIF_GlobalUnlock(0); + goto cleanup; + } +#endif + if (vmCount >= MAX_VMS) { + HostIF_GlobalUnlock(0); + goto cleanup; + } + + Vmx86RegisterVMOnList(vm); + + HostIF_GlobalUnlock(0); + + return vm; + +cleanup: + /* + * The VM is not on a list, "vmCount" has not been incremented, + * "vm->cowID" is INVALID_VMID, and either the VM's mutex hasn't + * been initialized or we've only taken the global lock and checked + * a counter since, so we know that the VM has not yet locked any + * pages. + */ + + ASSERT(vm->memInfo.locked == 0); + Vmx86FreeAllVMResources(vm); + + return NULL; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_ReleaseVM -- + * + * Release a VM (either created here or from a bind). + * + * Results: + * zero if successful + * + * Side effects: + * Decrement VM reference count. + * Release resources (those that are left) when count reaches 0. + * + *---------------------------------------------------------------------- + */ + +int +Vmx86_ReleaseVM(VMDriver *vm) // IN: +{ + ASSERT(vm); + HostIF_GlobalLock(1); + Vmx86DeleteVMFromList(vm); + HostIF_GlobalUnlock(1); + Vmx86FreeAllVMResources(vm); + + return 0; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_Open -- + * + * Called on open of the fd. + * + * Results: + * None. + * + * Side effects: + * Bumps fdCount. + * + *---------------------------------------------------------------------- + */ + +void +Vmx86_Open(void) +{ + HostIF_GlobalLock(123); + ASSERT(fdCount < MAX_INT32); + if (fdCount < MAX_INT32) { + fdCount++; + } + HostIF_GlobalUnlock(123); +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_Close -- + * + * Called on close of the fd. + * + * Results: + * None. + * + * Side effects: + * Decrements fdCount + * May de-initialize ptsc. + * + *---------------------------------------------------------------------- + */ + +void +Vmx86_Close(void) +{ + HostIF_GlobalLock(124); + + /* + * If fdCount hits MAX_INT32 saturate the counter and leave it at + * MAX_INT32. + */ + + ASSERT(fdCount > 0); + if (fdCount < MAX_INT32) { + fdCount--; + } + + /* + * If no VMs are running and there are no open file handles, reset the + * pseudo TSC state so that the next VM to initialize is free to + * initialize the system wide PTSC however it wants. See PR 403505. + */ + + if (fdCount == 0) { + ASSERT(vmCount == 0); + pseudoTSC.initialized = FALSE; + } + HostIF_GlobalUnlock(124); +} + + +/* + *----------------------------------------------------------------------------- + * + * Vmx86_InitVM -- + * + * Initializaiton of the VM. Expects all initial arguments + * to be part of the InitBlock structure. 
+ * + * Results: + * 0 on success + * != 0 on failure + * + * Side effects: + * Many + * + *----------------------------------------------------------------------------- + */ + +int +Vmx86_InitVM(VMDriver *vm, // IN + InitBlock *initParams) // IN/OUT: Initial params from the VM +{ + int retval; + + if (initParams->magicNumber != INIT_BLOCK_MAGIC) { + Warning("Bad magic number for init block 0x%x\n", + initParams->magicNumber); + + return 1; + } + if (initParams->numVCPUs > MAX_INITBLOCK_CPUS) { + Warning("Too many VCPUs for init block %d\n", initParams->numVCPUs); + + return 1; + } + vm->numVCPUs = initParams->numVCPUs; + + HostIF_InitFP(vm); + + /* + * Initialize the driver's part of the cross-over page used to + * talk to the monitor + */ + + retval = Task_InitCrosspage(vm, initParams); + if (retval) { + Warning("Task crosspage init died with retval=%d\n", retval); + /* + * Note that any clean-up of resources will be handled during + * power-off when Vmx86_ReleaseVM() is called as part of + * MonitorLoop_PowerOff(). + */ + + return 1; + } + + /* + * Check if we want to arbitrarily fail every N VM initializations. + * Useful in testing PR 72482. + */ + + if (initParams->vmInitFailurePeriod != 0) { + static uint32 counter = 0; + + if ((++counter) % initParams->vmInitFailurePeriod == 0) { + Warning("VM initialization failed on %d iteration\n", counter); + + return 1; + } + } + + return 0; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_ReadTSCAndUptime -- + * + * Atomically read the TSC and the uptime. + * + * Results: + * The current TSC and uptime values. + * + * Side effects: + * none + * + * + *---------------------------------------------------------------------- + */ + +void +Vmx86_ReadTSCAndUptime(VmTimeStart *st) // OUT: return value +{ + uintptr_t flags; + + SAVE_FLAGS(flags); + CLEAR_INTERRUPTS(); + + st->count = RDTSC(); + st->time = HostIF_ReadUptime(); + + RESTORE_FLAGS(flags); +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_ComputekHz -- + * + * Given aggregate cycles and system uptime, computes cycle rate as, + * + * khz = cycles / (uptime / HostIF_UptimeFrequency()) / 1000 + * + * We need to do the computation carefully to avoid overflow or + * undue loss of precision. Also, on Linux we can't do a + * 64/64=64 bit division directly, as the gcc stub for that + * is not linked into the kernel. + * + * Results: + * Returns the computed khz value, or 0 if uptime == 0. + * + * Side effects: + * none + * + *---------------------------------------------------------------------- + */ + +uint32 +Vmx86_ComputekHz(uint64 cycles, uint64 uptime) +{ + uint64 hz; + uint64 freq; + + freq = HostIF_UptimeFrequency(); + while (cycles > MAX_UINT64 / freq) { + cycles >>= 1; + uptime >>= 1; + } + + if (uptime == 0) { + return 0; + } + + hz = (cycles * freq) / uptime; + return (uint32) ((hz + 500) / 1000); +} + + +#ifdef __APPLE__ +/* + *---------------------------------------------------------------------- + * + * Vmx86GetBusyKHzEstimate + * + * Return an estimate the of the processor's kHz rating, based on + * a spinloop. This is especially useful on systems where the TSC + * is known to run at its maximum rate when we are using the CPU. + * As of 2006, Intel Macs are this way... the TSC rate is 0 if the + * CPU is in a deep enough sleep state, or at its max rate otherwise. + * + * Results: + * Processor speed in kHz. + * + * Side effects: + * None. 
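+ *
+ * Note (derived from the constants below): each of the ITERS = 100
+ * iterations spins for at least CYCLES_PER_ITER = 20000 TSC cycles, so
+ * roughly two million busy cycles and the uptime they consumed are fed
+ * to Vmx86_ComputekHz().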
+ * + *---------------------------------------------------------------------- + */ + +static INLINE_SINGLE_CALLER uint32 +Vmx86GetBusyKHzEstimate(void) +{ + static const int ITERS = 100; + static const int CYCLES_PER_ITER = 20000; + int i; + uint64 j; + uint64 aggregateCycles = 0; + uint64 aggregateUptime = 0; + + for (i = 0; i < ITERS; i++) { + NO_INTERRUPTS_BEGIN() { + aggregateCycles -= RDTSC(); + aggregateUptime -= HostIF_ReadUptime(); + for (j = RDTSC() + CYCLES_PER_ITER; RDTSC() < j; ) + ; + aggregateCycles += RDTSC(); + aggregateUptime += HostIF_ReadUptime(); + } NO_INTERRUPTS_END(); + } + + return Vmx86_ComputekHz(aggregateCycles, aggregateUptime); +} +#else // ifdef __APPLE__ + + +/* + *---------------------------------------------------------------------- + * + * Vmx86GetkHzEstimate + * + * Return an estimate of the processor's kHz rating, based on + * the ratio of the cycle counter and system uptime since the + * driver was loaded. + * This function could be called (on Windows) at IRQL DISPATCH_LEVEL. + * + *---------------------------------------------------------------------- + */ + +static INLINE_SINGLE_CALLER uint32 +Vmx86GetkHzEstimate(VmTimeStart *st) // IN: start time +{ + uint64 cDiff, tDiff; + uintptr_t flags; + + SAVE_FLAGS(flags); + CLEAR_INTERRUPTS(); + cDiff = RDTSC() - st->count; + tDiff = HostIF_ReadUptime() - st->time; + RESTORE_FLAGS(flags); + + return Vmx86_ComputekHz(cDiff, tDiff); +} +#endif // ifdef __APPLE__ + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_GetkHzEstimate + * + * Return an estimate of the processor's kHz rating, based on + * the ratio of the cycle counter and system uptime since the + * driver was loaded. Or based on a spinloop. + * + * This function could be called (on Windows) at IRQL DISPATCH_LEVEL. + * + * Results: + * Processor speed in kHz. + * + * Side effects: + * Result is cached. + * + *---------------------------------------------------------------------- + */ + +uint32 +Vmx86_GetkHzEstimate(VmTimeStart *st) // IN: start time +{ + static uint32 kHz; + + /* + * Cache and return the first result for consistency. + * TSC values can be changed without notification. + * TSC frequency can be vary too (SpeedStep, slowing clock on HALT, etc.) + */ + if (kHz != 0) { + return kHz; + } + +#ifdef __APPLE__ + return kHz = Vmx86GetBusyKHzEstimate(); +#else + return kHz = Vmx86GetkHzEstimate(st); +#endif +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_SetHostClockRate -- + * + * The monitor wants to poll for events at the given rate. If no VM + * is specified, then 'rate' is ignored and the last set rate is set + * again. + * + * Results: + * 0 for success, host-specific error code for failure. + * + * Side effects: + * May increase the host timer interrupt rate, etc. + * + *---------------------------------------------------------------------- + */ + +int +Vmx86_SetHostClockRate(VMDriver *vm, // IN: VM instance pointer + unsigned rate) // IN: rate in Hz +{ + unsigned newGlobalRate; + VMDriver *cur; + int retval = 0; + + if (!vm) { + Log("Resetting last set host clock rate of %d\n", globalFastClockRate); + HostIF_FastClockLock(0); + retval = HostIF_SetFastClockRate(globalFastClockRate); + HostIF_FastClockUnlock(0); + + return retval; + } + + /* Quick test before locks are acquired. 
*/ + if (vm->fastClockRate == rate) { + return retval; + } + + HostIF_FastClockLock(2); + if (vm->fastClockRate == rate) { + HostIF_FastClockUnlock(2); + + return retval; + } + + /* + * Loop through all vms to find new max rate. + */ + newGlobalRate = rate; + HostIF_GlobalLock(19); + for (cur = vmDriverList; cur != NULL; cur = cur->nextDriver) { + if (cur != vm && cur->fastClockRate > newGlobalRate) { + newGlobalRate = cur->fastClockRate; + } + } + HostIF_GlobalUnlock(19); + + if (newGlobalRate != globalFastClockRate) { + retval = HostIF_SetFastClockRate(newGlobalRate); + if (!retval) { + globalFastClockRate = newGlobalRate; + } + } + if (!retval) { + vm->fastClockRate = rate; + } + HostIF_FastClockUnlock(2); + + return retval; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_MonTimerIPI -- + * + * Check for VCPUs that are in the monitor and need an IPI to fire + * their next MonTimer callback. Should be called once per fast + * timer interrupt if the fast timer is in use. + * + * Results: + * None. + * + * Side effects: + * May send IPIs. + * + *---------------------------------------------------------------------- + */ + +void +Vmx86_MonTimerIPI(void) +{ + VMDriver *vm; + VmAbsoluteTS pNow, expiry; + + /* + * Loop through all vms -- needs the global lock to protect vmDriverList. + */ + + HostIF_GlobalLock(21); + + pNow = Vmx86_GetPseudoTSC(); + + for (vm = vmDriverList; vm != NULL; vm = vm->nextDriver) { + Vcpuid v; + VCPUSet expiredVCPUs; + VCPUSet_Empty(&expiredVCPUs); + + for (v = 0; v < vm->numVCPUs; v++) { + VMCrossPage *crosspage = vm->crosspage[v]; + + if (!crosspage) { + continue; // VCPU is not initialized yet + } + expiry = crosspage->crosspageData.monTimerExpiry; + if (expiry != 0 && expiry <= pNow) { + VCPUSet_Include(&expiredVCPUs, v); + } + } + if (!VCPUSet_IsEmpty(&expiredVCPUs) && + HostIF_IPI(vm, &expiredVCPUs) == IPI_BROADCAST) { + // no point in doing a broadcast for more than one VM. + break; + } + } + HostIF_GlobalUnlock(21); +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_GetNumVMs -- + * + * Return the number of VMs. + * + * Results: + * The number of VMs. + * + * Side effects: + * None. + * + *---------------------------------------------------------------------- + */ + +int32 +Vmx86_GetNumVMs(void) +{ + return vmCount; +} + + +int32 +Vmx86_GetTotalMemUsage(void) +{ + VMDriver *vm; + int totalmem = 0; + + HostIF_GlobalLock(15); + vm = vmDriverList; + + for (vm = vmDriverList; vm != NULL; vm = vm->nextDriver) { + /* + * The VM lock is not strictly necessary as the vm will + * stay on the list until we release the global lock and + * because of order in which "admitted" and "mainMemSize" + * are set when each VM is admitted. + */ + + if (vm->memInfo.admitted) { + totalmem += PAGES_2_MBYTES(ROUNDUP(vm->memInfo.mainMemSize, + MBYTES_2_PAGES(1))); + } + } + + HostIF_GlobalUnlock(15); + + return totalmem; +} + + +static INLINE unsigned +Vmx86MinAllocationFunc(unsigned nonpaged, + unsigned anonymous, + unsigned mainmem, + unsigned memPct) +{ + return RatioOf(memPct, mainmem, 100) + nonpaged + anonymous; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86MinAllocation -- + * + * Computes the minimum number of pages that must be allocated to a + * specific vm. The minAllocation for a vm is defined as + * some percentage of guest memory plus 100% of nonpagable (overhead) + * memory. 
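+ *
+ *      Worked example (illustrative numbers, assuming RatioOf(a, b, c)
+ *      computes b * a / c): memPct = 50, mainMemSize = 262144 pages
+ *      (1 GB), nonpaged = 10000 and anonymous = 5000 give
+ *      262144 * 50 / 100 + 10000 + 5000 = 146072 pages.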
+ * + * Results: + * The minAllocation for this vm. + * + * + * Side effects: + * Analyzes the vm info, requiring the vm lock. + * + *---------------------------------------------------------------------- + */ + +static INLINE unsigned +Vmx86MinAllocation(VMDriver *vm, + unsigned memPct) +{ + ASSERT(HostIF_VMLockIsHeld(vm)); + + return Vmx86MinAllocationFunc(vm->memInfo.nonpaged, vm->memInfo.anonymous, + vm->memInfo.mainMemSize, memPct); +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86CalculateGlobalMinAllocation -- + * + * Computes the sum of minimum allocations of each vm assuming a given + * percentage of guest memory must fit within host RAM. + * + * Results: + * Number of pages that must fit within host ram for a given overcommit + * level. + * + * + * Side effects: + * None. The actual minAllocations of each vm are NOT updated during + * this computation. + * + *---------------------------------------------------------------------- + */ + +static unsigned +Vmx86CalculateGlobalMinAllocation(unsigned memPct) +{ + VMDriver *vm; + unsigned minAllocation = 0; + + ASSERT(HostIF_GlobalLockIsHeld()); + /* Pages of other vms required to fit inside the hard limit. */ + for (vm = vmDriverList; vm; vm = vm->nextDriver) { + HostIF_VMLock(vm, 2); + if (vm->memInfo.admitted) { + minAllocation += Vmx86MinAllocation(vm, memPct); + } + HostIF_VMUnlock(vm, 2); + } + + return minAllocation; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86UpdateMinAllocations -- + * + * Updates the minimum allocation for each vm based on the global + * overcommitment percentage. + * + * Results: + * minAllocations for vms are changed. + * + * + * Side effects: + * None. + * + *---------------------------------------------------------------------- + */ + +static INLINE_SINGLE_CALLER void +Vmx86UpdateMinAllocations(unsigned memPct) // IN: +{ + VMDriver *vm; + + ASSERT(HostIF_GlobalLockIsHeld()); + /* Pages of other vms required to fit inside the hard limit. */ + for (vm = vmDriverList; vm; vm = vm->nextDriver) { + HostIF_VMLock(vm, 3); + if (vm->memInfo.admitted) { + vm->memInfo.minAllocation = Vmx86MinAllocation(vm, memPct); + } + HostIF_VMUnlock(vm, 3); + } +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_SetConfiguredLockedPagesLimit -- + * + * Set the user defined limit on the number of pages that can + * be locked. This limit can be raised at any time but not lowered. + * This avoids having a user lower the limit as vms are running and + * inadvertently cause the vms to crash because of memory starvation. + * + * Results: + * Returns TRUE on success and FALSE on failure to set the limit + * + * Side effects: + * Hard limit may be changed. + * + *---------------------------------------------------------------------- + */ + +Bool +Vmx86_SetConfiguredLockedPagesLimit(unsigned limit) // IN: +{ + Bool retval = FALSE; + + HostIF_GlobalLock(4); + if (limit >= lockedPageLimit.configured) { + lockedPageLimit.configured = limit; + retval = TRUE; + } + HostIF_GlobalUnlock(4); + + return retval; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_SetDynamicLockedPageLimit -- + * + * Set the dynamic locked page limit. This limit is determined by + * authd in response to host pressure. It can be both raised and + * lowered at any time. + * + * Results: + * None. + * + * Side effects: + * Hard limit may be changed. 
+ * + *---------------------------------------------------------------------- + */ + +void +Vmx86_SetDynamicLockedPagesLimit(unsigned limit) // IN: +{ + HostIF_GlobalLock(11); + lockedPageLimit.dynamic = limit; + HostIF_GlobalUnlock(11); +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_LockPage -- + * + * Lock a page. + * + * Results: + * A PAGE_LOCK_* status code and the MPN of the locked page on success. + * + * Side effects: + * Number of global and per-VM locked pages increased. + * + *---------------------------------------------------------------------- + */ + +int +Vmx86_LockPage(VMDriver *vm, // IN: VMDriver + VA64 uAddr, // IN: VA of the page to lock + Bool allowMultipleMPNsPerVA, // IN: allow locking many pages with the same VA + MPN *mpn) // OUT +{ + int retval; + + /* Atomically check and reserve locked memory */ + if (!Vmx86ReserveFreePages(vm, 1, FALSE)) { + return PAGE_LOCK_LIMIT_EXCEEDED; + } + + HostIF_VMLock(vm, 4); + retval = HostIF_LockPage(vm, uAddr, allowMultipleMPNsPerVA, mpn); + HostIF_VMUnlock(vm, 4); + + if (retval != PAGE_LOCK_SUCCESS) { + Vmx86UnreserveFreePages(vm, 1); + } + + return retval; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_UnlockPage -- + * + * Unlock a page. + * + * Results: + * A PAGE_UNLOCK_* status code. + * + * Side effects: + * Number of global and per-VM locked pages decreased. + * + *---------------------------------------------------------------------- + */ + +int +Vmx86_UnlockPage(VMDriver *vm, // IN + VA64 uAddr) // IN +{ + int retval; + + HostIF_VMLock(vm, 5); + retval = HostIF_UnlockPage(vm, uAddr); + HostIF_VMUnlock(vm, 5); + + if (retval == PAGE_UNLOCK_SUCCESS) { + Vmx86UnreserveFreePages(vm, 1); + } + + return retval; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_UnlockPageByMPN -- + * + * Unlock a page. + * + * Results: + * A PAGE_UNLOCK_* status code. + * + * Side effects: + * Number of global and per-VM locked pages decreased. + * + *---------------------------------------------------------------------- + */ + +int +Vmx86_UnlockPageByMPN(VMDriver *vm, // IN: VMDriver + MPN mpn, // IN: the page to unlock + VA64 uAddr) // IN: optional valid VA for this MPN +{ + int retval; + + HostIF_VMLock(vm, 6); + retval = HostIF_UnlockPageByMPN(vm, mpn, uAddr); + HostIF_VMUnlock(vm, 6); + + if (retval == PAGE_UNLOCK_SUCCESS) { + Vmx86UnreserveFreePages(vm, 1); + } + + return retval; +} + + +/* + *----------------------------------------------------------------------------- + * + * Vmx86_AllocLockedPages -- + * + * Allocate physical locked pages from the kernel. + * + * Initially the pages are not mapped to any user or kernel + * address space. + * + * Results: + * Non-negative value on partial/full completion: actual number of + * allocated MPNs. MPNs of the allocated pages are copied to the + * caller's buffer at 'addr'. + * + * Negative system specific error code on error (NTSTATUS on Windows, + * etc.) + * + * Side effects: + * Number of global and per-VM locked pages is increased. + * + *----------------------------------------------------------------------------- + */ + +int +Vmx86_AllocLockedPages(VMDriver *vm, // IN: VMDriver + VA64 addr, // OUT: VA of an array for + // allocated MPNs. + unsigned numPages, // IN: number of pages to allocate + Bool kernelMPNBuffer, // IN: is the MPN buffer in kernel + // or user address space? + Bool ignoreLimits) // IN: should limits be ignored? 
+{ + int allocatedPages; + + if (!Vmx86ReserveFreePages(vm, numPages, ignoreLimits)) { + // XXX What kind of system-specific error code is that? --hpreg + return PAGE_LOCK_LIMIT_EXCEEDED; + } + + HostIF_VMLock(vm, 7); + allocatedPages = HostIF_AllocLockedPages(vm, addr, numPages, + kernelMPNBuffer); + HostIF_VMUnlock(vm, 7); + + if (allocatedPages < 0) { + Vmx86UnreserveFreePages(vm, numPages); + } else if (allocatedPages < numPages) { + Vmx86UnreserveFreePages(vm, numPages - allocatedPages); + } + + return allocatedPages; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_FreeLockedPages -- + * + * Frees physical locked pages from the kernel previosly allocated + * by Vmx86_AllocLockedPages(). + * + * Results: + * 0 on success, + * non-0 system specific error code on error (NTSTATUS on Windows, etc.) + * + * Side effects: + * Number of global and per-VM locked pages is decreased. + * + *---------------------------------------------------------------------- + */ + +int +Vmx86_FreeLockedPages(VMDriver *vm, // IN: VM instance pointer + VA64 addr, // IN: user or kernel array of MPNs to free + unsigned numPages, // IN: number of pages to free + Bool kernelMPNBuffer) // IN: is the MPN buffer in kernel or user address space? +{ + int ret; + + HostIF_VMLock(vm, 8); + ret = HostIF_FreeLockedPages(vm, addr, numPages, kernelMPNBuffer); + HostIF_VMUnlock(vm, 8); + + if (ret == 0) { + Vmx86UnreserveFreePages(vm, numPages); + } + + return ret; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_GetNextAnonPage -- + * + * Queries the driver to retrieve the list of anonymous pages. + * A supplied value of INVALID_MPN will start the query from + * the head of the list. Callers supply the previously received + * mpn to retrieve the next in the chain. Note: There is no + * guarantee of coherency. + * + * Results: + * A valid mpn or INVALID_MPN if the list has been exhausted. + * + * Side effects: + * None. + * + *---------------------------------------------------------------------- + */ + +MPN +Vmx86_GetNextAnonPage(VMDriver *vm, // IN: VM instance pointer + MPN mpn) // IN: MPN +{ + MPN ret; + + HostIF_VMLock(vm, 22); + ret = HostIF_GetNextAnonPage(vm, mpn); + HostIF_VMUnlock(vm, 22); + + return ret; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_GetLockedPageList -- + * + * puts MPNs of pages that were allocated by HostIF_AllocLockedPages() + * into user mode buffer. + * + * Results: + * non-negative number of the MPNs in the buffer on success. + * negative error code on error. + * + * Side effects: + * none + * + *---------------------------------------------------------------------- + */ + +int +Vmx86_GetLockedPageList(VMDriver *vm, // IN: VM instance pointer + VA64 uAddr, // OUT: user mode buffer for MPNs + unsigned int numPages) // IN: size of the buffer in MPNs +{ + int ret; + + HostIF_VMLock(vm, 9); + ret = HostIF_GetLockedPageList(vm, uAddr, numPages); + HostIF_VMUnlock(vm, 9); + + return ret; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_GetMemInfo -- + * + * Return the info about all VMs. + * + * Results: + * TRUE if all info was successfully copied. + * + * Side effects: + * VMGetMemInfoArgs is filled in. If the supplied curVM is null + * then only the baseline information will be returned. 
Calling + * with a null curVM may return results for maxLockedPages + * that differ from those when the vm is passed if huge pages + * are in use. + * + *---------------------------------------------------------------------- + */ + +Bool +Vmx86_GetMemInfo(VMDriver *curVM, + Bool curVMOnly, + VMMemInfoArgs *outArgs, + int outArgsLength) +{ + VMDriver *vm; + int outSize; + int wantedVMs; + + HostIF_GlobalLock(7); + + if (curVMOnly) { + wantedVMs = 1; + } else { + wantedVMs = vmCount; + } + + outSize = VM_GET_MEM_INFO_SIZE(wantedVMs); + if (outSize > outArgsLength) { + HostIF_GlobalUnlock(7); + + return FALSE; + } + + outArgs->numVMs = wantedVMs; + outArgs->numLockedPages = numLockedPages; + outArgs->maxLockedPages = Vmx86LockedPageLimit(curVM); + outArgs->lockedPageLimit = lockedPageLimit; + outArgs->globalMinAllocation = Vmx86CalculateGlobalMinAllocation(minVmMemPct); + outArgs->minVmMemPct = minVmMemPct; + outArgs->callerIndex = (uint32)-1; + outArgs->currentTime = HostIF_ReadUptime() / HostIF_UptimeFrequency(); + + if (curVM == NULL) { + HostIF_GlobalUnlock(7); + + return TRUE; + } + + curVM->memInfo.timestamp = outArgs->currentTime; + if (wantedVMs == 1) { + outArgs->memInfo[0] = curVM->memInfo; + outArgs->callerIndex = 0; + } else { + int i; + for (i = 0, vm = vmDriverList; + vm != NULL && i < vmCount; + i++, vm = vm->nextDriver) { + if (vm == curVM) { + outArgs->callerIndex = i; + } + HostIF_VMLock(vm, 10); + outArgs->memInfo[i] = vm->memInfo; + HostIF_VMUnlock(vm, 10); + } + } + + HostIF_GlobalUnlock(7); + if (outArgs->callerIndex == -1) { + return FALSE; + } + return TRUE; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86SetMemoryUsage -- + * + * Updates the paged, nonpaged, and anonymous memory reserved memory + * values for the vm. + * + * Results: + * None + * + * Side effects: + * None + * + *---------------------------------------------------------------------- + */ + +static void +Vmx86SetMemoryUsage(VMDriver *curVM, // IN/OUT + unsigned paged, // IN + unsigned nonpaged, // IN + unsigned anonymous, // IN + unsigned aminVmMemPct) // IN +{ + ASSERT(HostIF_VMLockIsHeld(curVM)); + curVM->memInfo.paged = paged; + curVM->memInfo.nonpaged = nonpaged; + curVM->memInfo.anonymous = anonymous; + curVM->memInfo.minAllocation = Vmx86MinAllocation(curVM, aminVmMemPct); + curVM->memInfo.maxAllocation = curVM->memInfo.mainMemSize + nonpaged + + anonymous; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_Admit -- + * + * Set the memory management information about this VM and handles + * admission control. We allow vm to power on if there is room for + * the minimum allocation for all running vms in memory. Note that + * the hard memory limit can change dynamically in windows so we + * don't have guarantees due to admission control. + * + * Results: + * Returns global information about the memory state in args as well + * as a value indicating whether or not the virtual machine was + * started. + * + * Side effects: + * None + * + *---------------------------------------------------------------------- + */ + +void +Vmx86_Admit(VMDriver *curVM, // IN + VMMemInfoArgs *args) // IN/OUT +{ + Bool allowAdmissionCheck = FALSE; + unsigned int globalMinAllocation; + + HostIF_GlobalLock(9); + + /* + * Update the overcommitment level and minimums for all vms if they can + * fit under new minimum limit. If they do not fit, do nothing. 
And of + * course if existing VMs cannot fit under limit, likelihood that new VM + * will fit in is zero. + */ + + globalMinAllocation = Vmx86CalculateGlobalMinAllocation(args->minVmMemPct); + if (globalMinAllocation <= Vmx86LockedPageLimit(NULL)) { + allowAdmissionCheck = TRUE; + minVmMemPct = args->minVmMemPct; + Vmx86UpdateMinAllocations(args->minVmMemPct); + } + + HostIF_VMLock(curVM, 12); + + curVM->memInfo.shares = args->memInfo->shares; + curVM->memInfo.touchedPct = 100; + curVM->memInfo.dirtiedPct = 100; + curVM->memInfo.mainMemSize = args->memInfo->mainMemSize; + curVM->memInfo.perVMOverhead = args->memInfo->perVMOverhead; + + /* + * Always set the allocations required for the current configuration + * so that the user will know how bad situation really is with the + * suggested percentage. + */ + + curVM->memInfo.admitted = FALSE; + Vmx86SetMemoryUsage(curVM, args->memInfo->paged, args->memInfo->nonpaged, + args->memInfo->anonymous, args->minVmMemPct); + if (allowAdmissionCheck && + globalMinAllocation + curVM->memInfo.minAllocation <= + Vmx86LockedPageLimit(curVM)) { + curVM->memInfo.admitted = TRUE; + } + +#if defined _WIN32 + if (curVM->memInfo.admitted) { + unsigned int allocatedPages, nonpaged; + signed int pages; + MPN *mpns; + + /* + * More admission control: Get enough memory for the nonpaged portion + * of the VM. Drop locks for this long operation. + * XXX Timeout? + */ + + HostIF_VMUnlock(curVM, 12); + HostIF_GlobalUnlock(9); + +#define ALLOCATE_CHUNK_SIZE 64 + allocatedPages = 0; + nonpaged = args->memInfo->nonpaged + args->memInfo->anonymous; + mpns = HostIF_AllocKernelMem(nonpaged * sizeof *mpns, FALSE); + if (mpns == NULL) { + goto undoAdmission; + } + while (allocatedPages < nonpaged) { + pages = Vmx86_AllocLockedPages(curVM, + PtrToVA64(mpns + allocatedPages), + MIN(ALLOCATE_CHUNK_SIZE, nonpaged - allocatedPages), + TRUE, + FALSE); + if (pages <= 0) { + break; + } + allocatedPages += pages; + } + + /* + * Free the allocated pages. + * XXX Do not free the pages but hand them directly to the admitted VM. + */ + + for (pages = 0; pages < allocatedPages; pages += ALLOCATE_CHUNK_SIZE) { + Vmx86_FreeLockedPages(curVM, PtrToVA64(mpns + pages), + MIN(ALLOCATE_CHUNK_SIZE, allocatedPages - pages), TRUE); + } + HostIF_FreeKernelMem(mpns); +#undef ALLOCATE_CHUNK_SIZE + +undoAdmission: + if (allocatedPages != nonpaged) { + curVM->memInfo.admitted = FALSE; // undo admission + } + + HostIF_GlobalLock(9); + HostIF_VMLock(curVM, 12); + } +#endif + + /* Return global state to the caller. 
*/ + args->memInfo[0] = curVM->memInfo; + args->numVMs = vmCount; + args->numLockedPages = numLockedPages; + args->maxLockedPages = Vmx86LockedPageLimit(curVM); + args->lockedPageLimit = lockedPageLimit; + args->globalMinAllocation = globalMinAllocation; + HostIF_VMUnlock(curVM, 12); + HostIF_GlobalUnlock(9); +} + + +Bool +Vmx86_Readmit(VMDriver *curVM, OvhdMem_Deltas *delta) +{ + unsigned globalMinAllocation, newMinAllocation; + Bool retval = FALSE; + int paged; + int nonpaged; + int anonymous; + + HostIF_GlobalLock(31); + globalMinAllocation = Vmx86CalculateGlobalMinAllocation(minVmMemPct); + HostIF_VMLock(curVM, 31); + paged = curVM->memInfo.paged + delta->paged; + nonpaged = curVM->memInfo.nonpaged + delta->nonpaged; + anonymous = curVM->memInfo.anonymous + delta->anonymous; + + if (nonpaged >= 0 && paged >= 0 && anonymous >= 0) { + globalMinAllocation -= Vmx86MinAllocation(curVM, minVmMemPct); + newMinAllocation = Vmx86MinAllocationFunc(nonpaged, anonymous, + curVM->memInfo.mainMemSize, + minVmMemPct); + if (globalMinAllocation + newMinAllocation <= Vmx86LockedPageLimit(curVM) || + (delta->paged <= 0 && delta->nonpaged <= 0 && delta->anonymous <= 0)) { + Vmx86SetMemoryUsage(curVM, paged, nonpaged, anonymous, minVmMemPct); + retval = TRUE; + } + } + HostIF_VMUnlock(curVM, 31); + HostIF_GlobalUnlock(31); + + return retval; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_UpdateMemInfo -- + * + * Updates information about this VM with the new data supplied in + * a patch. + * + * Results: + * Sets the memory usage by this vm based on its memSample data. + * + * Side effects: + * None + * + *---------------------------------------------------------------------- + */ + +void +Vmx86_UpdateMemInfo(VMDriver *curVM, + const VMMemMgmtInfoPatch *patch) +{ + ASSERT(patch->touchedPct <= 100 && patch->dirtiedPct <= 100); + HostIF_VMLock(curVM, 13); + curVM->memInfo.touchedPct = AsPercent(patch->touchedPct); + curVM->memInfo.dirtiedPct = AsPercent(patch->dirtiedPct); + curVM->memInfo.hugePageBytes = patch->hugePageBytes; + HostIF_VMUnlock(curVM, 13); +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_PAEEnabled -- + * + * Is PAE enabled? + * + * Results: + * TRUE if PAE enabled. + * + * Side effects: + * None. + * + *---------------------------------------------------------------------- + */ + +Bool +Vmx86_PAEEnabled(void) +{ + uintptr_t cr4; + + GET_CR4(cr4); + + return (cr4 & CR4_PAE) != 0; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_VMXEnabled -- + * + * Test the VMXE bit as an easy proxy for whether VMX operation + * is enabled. + * + * Results: + * TRUE if the CPU supports VT and CR4.VMXE is set. + * + * Side effects: + * None. + * + *---------------------------------------------------------------------- + */ + +Bool +Vmx86_VMXEnabled(void) +{ + if (VT_CapableCPU()) { + uintptr_t cr4; + + GET_CR4(cr4); + + return (cr4 & CR4_VMXE) != 0; + } else { + return FALSE; + } +} + + +/* + *----------------------------------------------------------------------------- + * + * Vmx86LookupVMByUserIDLocked -- + * + * Lookup a VM by userID. The caller must hold the global lock. + * + * Returns: + * On success: Pointer to the driver's VM instance. + * On failure: NULL (not found). 
+ * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static VMDriver * +Vmx86LookupVMByUserIDLocked(int userID) // IN +{ + VMDriver *vm; + + ASSERT(HostIF_GlobalLockIsHeld()); + + for (vm = vmDriverList; vm != NULL; vm = vm->nextDriver) { + if (vm->userID == userID) { + return vm; + } + } + + return NULL; +} + + +/* + *----------------------------------------------------------------------------- + * + * Vmx86_LookupVMByUserID -- + * + * Lookup a VM by userID. + * + * Returns: + * On success: Pointer to the driver's VM instance. + * On failure: NULL (not found). + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +VMDriver * +Vmx86_LookupVMByUserID(int userID) // IN +{ + VMDriver *vm; + + HostIF_GlobalLock(10); + vm = Vmx86LookupVMByUserIDLocked(userID); + HostIF_GlobalUnlock(10); + + return vm; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_FastSuspResSetOtherFlag -- + * + * Sets the value of other VM's fastSuspResFlag. + * + * Returns: + * TRUE if VM was found and flag was set successfully. + * FALSE if VM was not found. + * + * Side effects: + * The value we set the flag to is this VM's userID. + * + *---------------------------------------------------------------------- + */ + +Bool +Vmx86_FastSuspResSetOtherFlag(VMDriver *vm, // IN + int otherVmUserId) // IN +{ + VMDriver *otherVM; + + HostIF_GlobalLock(35); + otherVM = Vmx86LookupVMByUserIDLocked(otherVmUserId); + if (otherVM != NULL) { + ASSERT(otherVM->fastSuspResFlag == 0); + otherVM->fastSuspResFlag = vm->userID; + } else { + Warning("otherVmUserId (%d) is invalid", otherVmUserId); + } + HostIF_GlobalUnlock(35); + + return otherVM != NULL; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_FastSuspResGetMyFlag -- + * + * Gets the value of fastSuspResFlag. If blockWait is true, this + * function will not return until the flag is non-zero, or until + * timeout. + * + * Returns: + * The value of the flag which, if non-zero, should be the userID of + * the vm that set it. + * + * Side effects: + * The flag is reset to zero once read. + * + *---------------------------------------------------------------------- + */ + +int +Vmx86_FastSuspResGetMyFlag(VMDriver *vm, // IN + Bool blockWait) // IN +{ + int retval = 0; + int ntries = 1; + const int waitInterval = 10; /* Wait 10ms at a time. */ + const int maxWaitTime = 100000; /* Wait maximum of 100 seconds. */ + + if (blockWait) { + ntries = maxWaitTime / waitInterval; + } + + while (ntries--) { + HostIF_GlobalLock(6); + retval = vm->fastSuspResFlag; + vm->fastSuspResFlag = 0; + HostIF_GlobalUnlock(6); + if (retval || !ntries) { + break; + } + HostIF_Wait(waitInterval); + } + + return retval; +} + + +/* + *----------------------------------------------------------------------------- + * + * Vmx86EnableHVOnCPU -- + * + * Enable HV on the current CPU, if possible. + * + * Results: + * None. + * + * Side effects: + * HV will be enabled, if possible. 
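+ *
+ * Note: on AMD this clears SVME_DISABLE and sets SVM_LOCK in MSR_VM_CR
+ * when CPUID reports SVM lock support; on Intel it sets the VMXE and
+ * LOCK bits in MSR_FEATCTL if that MSR is not already locked.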
+ * + *----------------------------------------------------------------------------- + */ + +static void +Vmx86EnableHVOnCPU(void) +{ + if (SVM_CapableCPU()) { + uint64 vmCR = __GET_MSR(MSR_VM_CR); + if (!SVM_LockedFromFeatures(vmCR)) { + CPUIDRegs regs; + __GET_CPUID(0x8000000A, ®s); + if (CPUID_GET(0x8000000A, EDX, SVM_LOCK, regs.edx) != 0) { + __SET_MSR(MSR_VM_CR, (vmCR & ~MSR_VM_CR_SVME_DISABLE) | + MSR_VM_CR_SVM_LOCK); + } + } + } + if (VT_CapableCPU()) { + uint64 featCtl = __GET_MSR(MSR_FEATCTL); + if (!VT_LockedFromFeatures(featCtl)) { + __SET_MSR(MSR_FEATCTL, featCtl | MSR_FEATCTL_LOCK | MSR_FEATCTL_VMXE); + } + } +} + + +/* + *----------------------------------------------------------------------------- + * + * Vmx86RefClockInCycles -- + * + * Convert the reference clock (HostIF_Uptime) to cycle units. + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint64 +Vmx86RefClockInCycles(uint64 uptime) +{ + return Mul64x3264(uptime, + pseudoTSC.refClockToPTSC.ratio.mult, + pseudoTSC.refClockToPTSC.ratio.shift); +} + + +/* + *----------------------------------------------------------------------------- + * + * Vmx86RefClockToPTSC -- + * + * Convert from the reference clock (HostIF_Uptime) time to pseudo TSC. + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint64 +Vmx86RefClockToPTSC(uint64 uptime) +{ + return Vmx86RefClockInCycles(uptime) + + Atomic_Read64(&pseudoTSC.refClockToPTSC.add); +} + + +/* + *----------------------------------------------------------------------------- + * + * Vmx86_InitPseudoTSC -- + * + * Initialize the pseudo TSC state if it is not already initialized. + * If another vmx has initialized the pseudo TSC, then we continue to + * use the parameters specified by the first vmx. + * + * Results: + * None + * + * Side effects: + * - Updates tscHz, the frequency of the PTSC in Hz. That frequency may + * differ from the value passed in if another VM is already running. + * - Updates the refClkToTSC parameters to be consistent with the tscHz + * value that's in use. + * + *----------------------------------------------------------------------------- + */ + +void +Vmx86_InitPseudoTSC(PTSCInitParams *params) // IN/OUT +{ + VmTimeStart startTime; + uint64 tsc, uptime; + + HostIF_GlobalLock(36); + + if (!pseudoTSC.initialized) { + pseudoTSC.hz = params->tscHz; + pseudoTSC.refClockToPTSC.ratio.mult = params->refClockToPTSC.mult; + pseudoTSC.refClockToPTSC.ratio.shift = params->refClockToPTSC.shift; + + Vmx86_ReadTSCAndUptime(&startTime); + tsc = startTime.count; + uptime = startTime.time; + + /* Start Pseudo TSC at initialPTSC (usually 0). */ + pseudoTSC.tscOffset = params->initialPTSC - tsc; + Atomic_Write64(&pseudoTSC.refClockToPTSC.add, + params->initialPTSC - Vmx86RefClockInCycles(uptime)); + + /* forceRefClock gets priority. */ + pseudoTSC.useRefClock = params->forceRefClock; + pseudoTSC.neverSwitchToRefClock = params->forceTSC; + pseudoTSC.hwTSCsSynced = params->hwTSCsSynced; + Log("PTSC: initialized at %"FMT64"u Hz using %s, TSCs are %ssynchronized.\n", + pseudoTSC.hz, pseudoTSC.useRefClock ? "reference clock" : "TSC", + pseudoTSC.hwTSCsSynced ? "" : "not "); + + pseudoTSC.initialized = TRUE; + } + /* + * Allow the calling vmx to respect ptsc.noTSC=TRUE config option + * even if another vmx is already running (pseudoTSC was already + * initialized). Useful for testing. 
+ */ + if (params->forceRefClock) { + Vmx86_SetPseudoTSCUseRefClock(); + } + params->refClockToPTSC.mult = pseudoTSC.refClockToPTSC.ratio.mult; + params->refClockToPTSC.shift = pseudoTSC.refClockToPTSC.ratio.shift; + params->refClockToPTSC.add = Atomic_Read64(&pseudoTSC.refClockToPTSC.add); + params->tscOffset = pseudoTSC.tscOffset; + params->tscHz = pseudoTSC.hz; + params->hwTSCsSynced = pseudoTSC.hwTSCsSynced; + + HostIF_GlobalUnlock(36); +} + + +/* + *----------------------------------------------------------------------------- + * + * Vmx86_GetPseudoTSC -- + * + * Read the pseudo TSC. We prefer to implement the pseudo TSC using + * TSC. On systems where the TSC varies its rate (e.g. Pentium M), + * stops advancing when the core is in deep sleep (e.g. Core 2 Duo), + * or the TSCs can get out of sync across cores (e.g. Opteron due to + * halt clock ramping, Core 2 Duo due to independent core deep sleep + * states; though WinXP does handle the Core 2 Duo out of sync case; + * and on IBM x-Series NUMA machines), we use a reference clock + * (HostIF_ReadUptime()) as the basis for pseudo TSC. + * + * Note that we depend on HostIF_ReadUptime being a high resolution + * timer that is synchronized across all cores. + * + * Results: + * Current value of the PTSC. + * + *----------------------------------------------------------------------------- + */ + +uint64 +Vmx86_GetPseudoTSC(void) +{ + if (Vmx86_PseudoTSCUsesRefClock()) { + return Vmx86RefClockToPTSC(HostIF_ReadUptime()); + } + return RDTSC() + pseudoTSC.tscOffset; +} + + +/* + *----------------------------------------------------------------------------- + * + * Vmx86_CheckPseudoTSC -- + * + * Periodically called by userspace to check whether the TSC is + * reliable, using the reference clock as the trusted time source. + * If the TSC is unreliable, switch the basis of the PTSC from the + * TSC to the reference clock. + * + * Also, recompute the "add" component of the reference clock to PTSC + * conversion, to periodically eliminate the drift between the two + * clocks. That way, if the PTSC switches from using the TSC to the + * reference clock, PTSC will remain (roughly) continuous. See PR + * 547055. + * + * Note that we might be executing concurrently with other threads, + * but it doesn't matter since we only ever go from using the TSC to + * using the reference clock, never the other direction. + * + * Results: + * TRUE if the PTSC is implemented by the reference clock. + * FALSE if the PTSC is implemented by the TSC. + * + * Side effects: + * May switch the basis of the PTSC from the TSC to the reference clock. + * + *----------------------------------------------------------------------------- + */ + +Bool +Vmx86_CheckPseudoTSC(uint64 *lastTSC, // IN/OUT: last/current value of the TSC + uint64 *lastRC) // IN/OUT: last/current value of the reference clock +{ + VmTimeStart curTime; + + Vmx86_ReadTSCAndUptime(&curTime); + + if (pseudoTSC.initialized && *lastTSC && !Vmx86_PseudoTSCUsesRefClock()) { + uint64 tsc, refClkTS, refClkLastTS; + uint64 tscDiff, refClkDiff; + + tsc = curTime.count; + + refClkTS = Vmx86RefClockInCycles(curTime.time); + refClkLastTS = Vmx86RefClockInCycles(*lastRC); + + tscDiff = tsc - *lastTSC; + refClkDiff = refClkTS - refClkLastTS; + + if (((int64)tscDiff < 0) || + (tscDiff * 100 < refClkDiff * 95) || + (tscDiff * 95 > refClkDiff * 100)) { + /* + * TSC went backwards or drifted from the reference clock by + * more than 5% over the last poll period. 
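+ *
+ * Example (illustrative numbers): with refClkDiff = 1,000,000 cycles
+ * over the poll period, a tscDiff below 950,000 or above roughly
+ * 1,052,632 trips the check, i.e. the TSC is kept only while
+ * 0.95 * refClkDiff <= tscDiff <= (100/95) * refClkDiff.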
+ */ + Vmx86_SetPseudoTSCUseRefClock(); + } else { + uint64 ptscFromTSC = tsc + pseudoTSC.tscOffset; + Atomic_Write64(&pseudoTSC.refClockToPTSC.add, ptscFromTSC - refClkTS); + } + } + *lastTSC = curTime.count; + *lastRC = curTime.time; + + return Vmx86_PseudoTSCUsesRefClock(); +} + + +typedef struct { + Atomic_uint32 index; + MSRQuery *query; +} Vmx86GetMSRData; + + +/* + *----------------------------------------------------------------------------- + * + * Vmx86GetMSR -- + * + * Collect MSR value on the current logical CPU. + * + * Function must not block (it is invoked from interrupt context). + * Only VT MSRs are supported on VT-capable processors. + * + * Results: + * None. + * + * Side effects: + * 'data->index' is atomically incremented by one. + * + *----------------------------------------------------------------------------- + */ + +static void +Vmx86GetMSR(void *clientData) // IN/OUT: A Vmx86GetMSRData * +{ + Vmx86GetMSRData *data = (Vmx86GetMSRData *)clientData; + MSRQuery *query; + uint32 index; + int err; + + ASSERT(data); + query = data->query; + ASSERT(query); + + index = Atomic_ReadInc32(&data->index); + if (index >= query->numLogicalCPUs) { + return; + } + + query->logicalCPUs[index].tag = HostIF_GetCurrentPCPU(); + + /* + * We treat BIOS_SIGN_ID (microcode version) specially on Intel, + * where the preferred read sequence involves a macro. + */ + + if (CPUID_GetVendor() == CPUID_VENDOR_INTEL && + query->msrNum == MSR_BIOS_SIGN_ID) { + /* safe to read: MSR_BIOS_SIGN_ID architectural since Pentium Pro */ + query->logicalCPUs[index].msrVal = INTEL_MICROCODE_VERSION(); + err = 0; + } else { + /* + * Try to enable HV any time these MSRs are queried. We have seen + * buggy formware that forgets to re-enable HV after waking from + * deep sleep. [PR 1020692] + */ + if (query->msrNum == MSR_FEATCTL || query->msrNum == MSR_VM_CR) { + Vmx86EnableHVOnCPU(); + } + err = HostIF_SafeRDMSR(query->msrNum, &query->logicalCPUs[index].msrVal); + } + + query->logicalCPUs[index].implemented = (err == 0) ? 1 : 0; +} + + +/* + *----------------------------------------------------------------------------- + * + * Vmx86_GetAllMSRs -- + * + * Collect MSR value on all logical CPUs. + * + * The caller is responsible for ensuring that the requested MSR is valid + * on all logical CPUs. + * + * 'query->numLogicalCPUs' is the size of the 'query->logicalCPUs' output + * array. + * + * Results: + * On success: TRUE. 'query->logicalCPUs' is filled and + * 'query->numLogicalCPUs' is adjusted accordingly. + * On failure: FALSE. Happens if 'query->numLogicalCPUs' was too small. + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +Bool +Vmx86_GetAllMSRs(MSRQuery *query) // IN/OUT +{ + Vmx86GetMSRData data; + + Atomic_Write32(&data.index, 0); + data.query = query; + + HostIF_CallOnEachCPU(Vmx86GetMSR, &data); + + /* + * At this point, Atomic_Read32(&data.index) is the number of logical CPUs + * who replied. + */ + + if (Atomic_Read32(&data.index) > query->numLogicalCPUs) { + return FALSE; + } + + ASSERT(Atomic_Read32(&data.index) <= query->numLogicalCPUs); + query->numLogicalCPUs = Atomic_Read32(&data.index); + + return TRUE; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_YieldToSet -- + * + * Yield the CPU until a vCPU from the requested set has run. + * + * usecs is the total spin time in monitor. 
Very low numbers + * indicate we detected there was a vCPU thread that was not + * in the monitor, so we didn't spin. In that case, simply + * nudge the threads we want and return. + * + * Results: + * The current CPU yields whenever possible. + * + * Side effects: + * None. + * + *---------------------------------------------------------------------- + */ + +void +Vmx86_YieldToSet(VMDriver *vm, // IN: + Vcpuid currVcpu, // IN: + const VCPUSet *req, // IN: + uint32 usecs, // IN: + Bool skew) // IN: +{ + VCPUSet vcpus; + + if (VCPUSet_IsEmpty(req)) { + return; + } + +#ifdef __APPLE__ + if (skew) { + /* Mac scheduler yield does fine in the skew case */ + (void)thread_block(THREAD_CONTINUE_NULL); + return; + } +#endif + + /* Crosscalls should spin a few times before blocking */ + if (!skew && usecs < CROSSCALL_SPIN_SHORT_US) { + HostIF_WakeUpYielders(vm, currVcpu); + return; + } + + if (HostIF_PrepareWaitForThreads(vm, currVcpu)) { + return; + } + + VCPUSet_Empty(&vcpus); + FOR_EACH_VCPU_IN_SET(req, vcpuid) { + if (vcpuid == currVcpu) { + continue; + } + /* + * First assume the vCPU we want to have wake up the current vCPU + * is out of the monitor, so set its wakeup bit corresponding to + * the current vCPU. It may or may not actually be on the vmmon side. + */ + + VCPUSet_AtomicInclude(&vm->crosscallWaitSet[vcpuid], currVcpu); + + /* + * Now that the bit is set, check whether the vCPU is in vmmon. If + * it was previously in vmmon, and then took a trip to the monitor + * and back before we got here, then the wakeup has already been sent. + * If it is in the monitor, either it started in vmmon and sent the + * wakeup, or it was there the entire time. In either case we can + * clear the bit. This is safe because the bit is directed solely + * at the current vCPU. + */ + + if (vm->currentHostCpu[vcpuid] != INVALID_PCPU) { + VCPUSet_AtomicRemove(&vm->crosscallWaitSet[vcpuid], currVcpu); + } else { + if (VCPUSet_AtomicIsMember(&vm->crosscallWaitSet[vcpuid], currVcpu)) { + VCPUSet_Include(&vcpus, vcpuid); + } + } + } ROF_EACH_VCPU_IN_SET(); + + /* + * Wake up any threads that had previously yielded the processor to + * let this one run. + */ + + HostIF_WakeUpYielders(vm, currVcpu); + + /* + * If this thread has other threads to wait for, and no other threads + * are waiting for this thread, block until one of the threads we're + * waiting for has run. + */ + + if (!VCPUSet_IsEmpty(&vcpus) && + VCPUSet_IsEmpty(&vm->crosscallWaitSet[currVcpu])) { + HostIF_WaitForThreads(vm, currVcpu); + } + + /* + * Tell other vcpus that they no longer have to wake this one. + * This is optional, the other threads will eventually clear their + * bits anyway. + */ + + FOR_EACH_VCPU_IN_SET(&vcpus, vcpuid) { + VCPUSet_AtomicRemove(&vm->crosscallWaitSet[vcpuid], currVcpu); + } ROF_EACH_VCPU_IN_SET(); + + HostIF_CancelWaitForThreads(vm, currVcpu); +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86PerfCtrInUse -- + * + * Determine which performance counters are already in use by the + * host on the current PCPU. A performance counter is considered + * in use if its event select enable bit is set or if this method + * is unable to count events with the performance counter. + * + * Results: + * Return TRUE if counter is in use. + * + * Side effects: + * None. 
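+ *
+ * Probe outline (informal summary of the code below): save the
+ * control and count MSRs, enable the counter for kernel-mode
+ * counting (retired instructions in the general-purpose case), spin
+ * through a short delay loop, then restore both MSRs.  If the count
+ * did not advance, the counter is reported as in use.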
+ *---------------------------------------------------------------------- + */ +static Bool +Vmx86PerfCtrInUse(Bool isGen, unsigned pmcNum, unsigned ctrlMSR, + unsigned cntMSR, Bool hasPGC) +{ + volatile unsigned delay; + uint64 origPGC = hasPGC ? __GET_MSR(PERFCTR_CORE_GLOBAL_CTRL_ADDR) : 0; + uint64 pmcCtrl; + uint64 pmcCount, count; + uint64 ctrlEna, pgcEna; + + pmcCtrl = __GET_MSR(ctrlMSR); + if (isGen) { + ASSERT(pmcNum < 32); + if ((pmcCtrl & PERFCTR_CPU_ENABLE) != 0) { + return TRUE; + } + ctrlEna = PERFCTR_CPU_ENABLE | PERFCTR_CPU_KERNEL_MODE | + PERFCTR_CORE_INST_RETIRED; + pgcEna = CONST64U(1) << pmcNum; + } else { + ASSERT(pmcNum < 3); + if ((pmcCtrl & PERFCTR_CORE_FIXED_ENABLE_MASKn(pmcNum)) != 0) { + return TRUE; + } + ctrlEna = pmcCtrl | PERFCTR_CORE_FIXED_KERNEL_MASKn(pmcNum); + pgcEna = CONST64U(1) << (pmcNum + 32); + } + pmcCount = __GET_MSR(cntMSR); + /* Enable the counter. */ + __SET_MSR(ctrlMSR, ctrlEna); + if (hasPGC) { + __SET_MSR(PERFCTR_CORE_GLOBAL_CTRL_ADDR, pgcEna | origPGC); + } + /* Retire some instructions and wait a few cycles. */ + for (delay = 0; delay < 100; delay++) ; + /* Disable the counter. */ + if (hasPGC) { + __SET_MSR(PERFCTR_CORE_GLOBAL_CTRL_ADDR, origPGC); + } + count = __GET_MSR(cntMSR); + __SET_MSR(ctrlMSR, pmcCtrl); + __SET_MSR(cntMSR, pmcCount); + return count == pmcCount; +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86GetUnavailPerfCtrsOnCPU -- + * + * Determine which performance counters are already in use by the + * host on the current PCPU. + * + * Results: + * A bitset representing unavailable performance counter. + * Bits 0-31 represent general purpose counters, and bits 32-63 + * represent fixed counters. + * + * Side effects: + * None. + * + *---------------------------------------------------------------------- + */ + +static void +Vmx86GetUnavailPerfCtrsOnCPU(void *data) +{ + CPUIDRegs regs; + unsigned i, numGen = 0, numFix = 0, stride = 1; + uint32 selBase = 0; + uint32 ctrBase = 0; + Bool hasPGC = FALSE; + Atomic_uint64 *ctrs = (Atomic_uint64 *)data; + uintptr_t flags; + if (CPUID_GetVendor() == CPUID_VENDOR_INTEL) { + unsigned version; + if (__GET_EAX_FROM_CPUID(0) < 0xA) { + return; + } + __GET_CPUID(0xA, ®s); + version = CPUID_GET(0xA, EAX, PMC_VERSION, regs.eax); + if (version == 0) { + return; + } + numGen = CPUID_GET(0xA, EAX, PMC_NUM_GEN, regs.eax); + if (version >= 2) { + numFix = CPUID_GET(0xA, EDX, PMC_NUM_FIXED, regs.edx); + hasPGC = TRUE; + } + selBase = PERFCTR_CORE_PERFEVTSEL0_ADDR; + ctrBase = PERFCTR_CORE_PERFCTR0_ADDR; + } else if (CPUID_GetVendor() == CPUID_VENDOR_AMD) { + if (CPUID_FAMILY_IS_BULLDOZER(__GET_EAX_FROM_CPUID(1))) { + numGen = 6; + selBase = PERFCTR_BD_BASE_ADDR + PERFCTR_BD_EVENTSEL; + ctrBase = PERFCTR_BD_BASE_ADDR + PERFCTR_BD_CTR; + stride = 2; + } else { + numGen = 4; + selBase = PERFCTR_AMD_PERFEVTSEL0_ADDR; + ctrBase = PERFCTR_AMD_PERFCTR0_ADDR; + } + } + ASSERT(numGen <= 32 && numFix <= 32); + + /* + * Vmx86PerfCtrInUse modifies performance counters to determine if + * if they are usable, disable interrupts to avoid racing with + * interrupt handlers. 
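+ * The SAVE_FLAGS / CLEAR_INTERRUPTS / RESTORE_FLAGS bracket below
+ * keeps the probe sequence atomic with respect to local interrupts
+ * on this PCPU.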
+ */ + SAVE_FLAGS(flags); + CLEAR_INTERRUPTS(); + for (i = 0; i < numGen; i++) { + if (Vmx86PerfCtrInUse(TRUE, i, selBase + i * stride, + ctrBase + i * stride, hasPGC)) { + Atomic_SetBit64(ctrs, i); + } + } + if (numFix > 0) { + for (i = 0; i < numFix; i++) { + if (Vmx86PerfCtrInUse(FALSE, i, PERFCTR_CORE_FIXED_CTR_CTRL_ADDR, + PERFCTR_CORE_FIXED_CTR0_ADDR + i, hasPGC)) { + Atomic_SetBit64(ctrs, i + 32); + } + } + } + RESTORE_FLAGS(flags); +} + + +/* + *---------------------------------------------------------------------- + * + * Vmx86_GetUnavailablePerfCtrs -- + * + * Determine which performance counters are already in use by the + * host on across all PCPUs, and therefore unavailable for use by + * the monitor. A performance counter is considered in use if its + * event select enable bit on any PCPU is set. + * + * Results: + * A bitset representing unavailable performance counter. + * Bits 0-31 represent general purpose counters, and bits 32-63 + * represent fixed counters. + * + * Side effects: + * None. + * + *---------------------------------------------------------------------- + */ + +uint64 +Vmx86_GetUnavailablePerfCtrs(void) +{ + Atomic_uint64 unavailCtrs; + Atomic_Write64(&unavailCtrs, 0); + HostIF_CallOnEachCPU(Vmx86GetUnavailPerfCtrsOnCPU, &unavailCtrs); + return Atomic_Read64(&unavailCtrs); +} + diff --git a/vmmon-only/common/vmx86.h b/vmmon-only/common/vmx86.h new file mode 100644 index 00000000..71ea01b9 --- /dev/null +++ b/vmmon-only/common/vmx86.h @@ -0,0 +1,201 @@ +/********************************************************* + * Copyright (C) 1998-2013,2015-2016 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * vmx86.h - Platform independent data and interface for supporting + * the vmx86 device driver. + */ + +#ifndef VMX86_H +#define VMX86_H + +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMCORE +#include "includeCheck.h" + +#include "x86apic.h" +#include "x86msr.h" +#include "modulecall.h" +#include "vcpuid.h" +#include "initblock.h" +#include "iocontrols.h" +#include "numa_defs.h" +#include "rateconv.h" +#include "vmmem_shared.h" +#include "apic.h" + +typedef struct PseudoTSCOffsetInfo { + uint32 inVMMCnt; /* Number of vcpus executing in the VMM. */ + uint32 vcpuid; /* Index into VMDriver.ptscOffsets. */ +} PseudoTSCOffsetInfo; + +typedef struct TSCDelta { + Atomic_uint64 min; + Atomic_uint64 max; +} TSCDelta; + +/* + * VMDriver - the main data structure for the driver side of a + * virtual machine. + */ + +typedef struct VMDriver { + /* Unique (in the driver), strictly positive, VM ID used by userland. */ + int userID; + + struct VMDriver *nextDriver; /* Next on list of all VMDrivers */ + + Vcpuid numVCPUs; /* Number of vcpus in VM. */ + struct VMHost *vmhost; /* Host-specific fields. 
*/ + + /* Pointers to the crossover pages shared with the monitor. */ + struct VMCrossPage *crosspage[MAX_INITBLOCK_CPUS]; + volatile uint32 currentHostCpu[MAX_INITBLOCK_CPUS]; + VCPUSet crosscallWaitSet[MAX_INITBLOCK_CPUS]; + APICDescriptor hostAPIC; + + struct MemTrack *memtracker; /* Memory tracker pointer */ + Bool checkFuncFailed; + struct PerfCounter *perfCounter; + VMMemMgmtInfo memInfo; + unsigned fastClockRate;/* Protected by FastClockLock. */ + int fastSuspResFlag; + + volatile PseudoTSCOffsetInfo ptscOffsetInfo; /* Volatile per PR 699101#29. */ + Atomic_uint64 ptscLatest; + int64 ptscOffsets[MAX_INITBLOCK_CPUS]; +} VMDriver; + +typedef struct VmTimeStart { + uint64 count; + uint64 time; +} VmTimeStart; + +typedef struct RefClockParams { + RateConv_Ratio ratio; + Atomic_uint64 add; +} RefClockParams; + +typedef struct PseudoTSC { + RefClockParams refClockToPTSC; + int64 tscOffset; + uint64 hz; + volatile Bool useRefClock; + Bool neverSwitchToRefClock; + Bool hwTSCsSynced; + volatile Bool initialized; +} PseudoTSC; + +extern PseudoTSC pseudoTSC; + +#define MAX_LOCKED_PAGES (-1) + +extern VMDriver *Vmx86_CreateVM(void); +extern int Vmx86_ReleaseVM(VMDriver *vm); +extern int Vmx86_InitVM(VMDriver *vm, InitBlock *initParams); +extern int Vmx86_LateInitVM(VMDriver *vm); +extern int Vmx86_RunVM(VMDriver *vm, Vcpuid vcpuid); +extern void Vmx86_YieldToSet(VMDriver *vm, Vcpuid currVcpu, const VCPUSet *req, + uint32 usecs, Bool skew); +extern void Vmx86_ReadTSCAndUptime(VmTimeStart *st); +extern uint32 Vmx86_ComputekHz(uint64 cycles, uint64 uptime); +extern uint32 Vmx86_GetkHzEstimate(VmTimeStart *st); +extern int Vmx86_SetHostClockRate(VMDriver *vm, unsigned rate); +extern int Vmx86_LockPage(VMDriver *vm, + VA64 uAddr, + Bool allowMultipleMPNsPerVA, + MPN *mpn); +extern int Vmx86_UnlockPage(VMDriver *vm, VA64 uAddr); +extern int Vmx86_UnlockPageByMPN(VMDriver *vm, MPN mpn, VA64 uAddr); +extern MPN Vmx86_GetRecycledPage(VMDriver *vm); +extern int Vmx86_ReleaseAnonPage(VMDriver *vm, MPN mpn); +extern int Vmx86_AllocLockedPages(VMDriver *vm, VA64 addr, + unsigned numPages, Bool kernelMPNBuffer, + Bool ignoreLimits); +extern int Vmx86_FreeLockedPages(VMDriver *vm, VA64 addr, + unsigned numPages, Bool kernelMPNBuffer); +extern MPN Vmx86_GetNextAnonPage(VMDriver *vm, MPN mpn); +extern int Vmx86_GetLockedPageList(VMDriver *vm, VA64 uAddr, + unsigned int numPages); + +extern int32 Vmx86_GetNumVMs(void); +extern int32 Vmx86_GetTotalMemUsage(void); +extern Bool Vmx86_SetConfiguredLockedPagesLimit(unsigned limit); +extern void Vmx86_SetDynamicLockedPagesLimit(unsigned limit); +extern Bool Vmx86_GetMemInfo(VMDriver *curVM, + Bool curVMOnly, + VMMemInfoArgs *args, + int outArgsLength); +extern void Vmx86_Admit(VMDriver *curVM, VMMemInfoArgs *args); +extern Bool Vmx86_Readmit(VMDriver *curVM, OvhdMem_Deltas *delta); +extern void Vmx86_UpdateMemInfo(VMDriver *curVM, + const VMMemMgmtInfoPatch *patch); +extern void Vmx86_Add2MonPageTable(VMDriver *vm, VPN vpn, MPN mpn, + Bool readOnly); +extern Bool Vmx86_PAEEnabled(void); +extern Bool Vmx86_VMXEnabled(void); +extern Bool Vmx86_GetAllMSRs(MSRQuery *query); +extern void Vmx86_MonTimerIPI(void); +extern void Vmx86_InitIDList(void); +extern VMDriver *Vmx86_LookupVMByUserID(int userID); +extern Bool Vmx86_FastSuspResSetOtherFlag(VMDriver *vm, int otherVmUserId); +extern int Vmx86_FastSuspResGetMyFlag(VMDriver *vm, Bool blockWait); +extern void Vmx86_Open(void); +extern void Vmx86_Close(void); + +static INLINE Bool +Vmx86_HwTSCsSynced(void) +{ + return 
pseudoTSC.hwTSCsSynced; +} + +static INLINE Bool +Vmx86_PseudoTSCUsesRefClock(void) +{ + return pseudoTSC.useRefClock; +} + +static INLINE Bool +Vmx86_SetPseudoTSCUseRefClock(void) +{ + if (!pseudoTSC.useRefClock && !pseudoTSC.neverSwitchToRefClock) { + pseudoTSC.useRefClock = TRUE; + return TRUE; + } + return FALSE; +} + +static INLINE uint64 +Vmx86_GetPseudoTSCHz(void) +{ + return pseudoTSC.hz; +} + +static INLINE uint64 +Vmx86_GetPseudoTSCOffset(void) +{ + return pseudoTSC.tscOffset; +} + +extern void Vmx86_InitPseudoTSC(PTSCInitParams *params); +extern Bool Vmx86_CheckPseudoTSC(uint64 *lastTSC, uint64 *lastRC); +extern uint64 Vmx86_GetPseudoTSC(void); + +extern uint64 Vmx86_GetUnavailablePerfCtrs(void); + +#endif diff --git a/vmmon-only/include/address_defs.h b/vmmon-only/include/address_defs.h new file mode 100644 index 00000000..f7ba0645 --- /dev/null +++ b/vmmon-only/include/address_defs.h @@ -0,0 +1,95 @@ +/********************************************************* + * Copyright (C) 2014 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * address_defs.h -- + * + * Macros for virtual/physical/machine address/page conversions, page types. + */ + +#ifndef _ADDRESS_DEFS_H_ +#define _ADDRESS_DEFS_H_ + +#define INCLUDE_ALLOW_USERLEVEL +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_VMK_MODULE +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_DISTRIBUTE +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_VMMON +#include "includeCheck.h" + +#include "vm_basic_defs.h" // For PAGE_SHIFT + +/* + * Virtual, physical, machine address and page conversion macros + */ + +#define VA_2_VPN(_va) ((_va) >> PAGE_SHIFT) +#define PTR_2_VPN(_ptr) VA_2_VPN((VA)(_ptr)) +#define VPN_2_VA(_vpn) ((_vpn) << PAGE_SHIFT) +#define VPN_2_PTR(_vpn) ((void *)VPN_2_VA(_vpn)) + +/* + * Notice that we don't cast PA_2_PPN's argument to an unsigned type, because + * we would lose compile-time checks for pointer operands and byte-sized + * operands. If you use a signed quantity for _pa, ones may be shifted into the + * high bits of your ppn. + */ + +#define PA_2_PPN(_pa) ((_pa) >> PAGE_SHIFT) +#define PPN_2_PA(_ppn) ((PA)(_ppn) << PAGE_SHIFT) + +static INLINE MA MPN_2_MA(MPN mpn) { return (MA)mpn << PAGE_SHIFT; } +static INLINE MPN MA_2_MPN(MA ma) { return (MPN)(ma >> PAGE_SHIFT); } + +static INLINE IOA IOPN_2_IOA(IOPN iopn) { return (IOA)(iopn << PAGE_SHIFT); } +static INLINE IOPN IOA_2_IOPN(IOA ioa) { return (IOPN)(ioa >> PAGE_SHIFT); } + +typedef char PageArray[PAGE_SIZE]; + +/* + *---------------------------------------------------------------------- + * + * IsGoodMPN -- + * + * Is the given MPN valid? + * + * Results: + * Return TRUE if "mpn" looks plausible. We could make this stricter on + * a per-architecture basis. + * + * Side effects: + * None. 
+ * + *---------------------------------------------------------------------- + */ + +static INLINE Bool +IsGoodMPN(MPN mpn) +{ + return mpn <= MAX_MPN; +} + +static INLINE Bool +IsGoodMPNOrMemref(MPN mpn) +{ + return IsGoodMPN(mpn) || mpn == MEMREF_MPN; +} + +#endif diff --git a/vmmon-only/include/basic_initblock.h b/vmmon-only/include/basic_initblock.h new file mode 100644 index 00000000..438e9b61 --- /dev/null +++ b/vmmon-only/include/basic_initblock.h @@ -0,0 +1,60 @@ +/********************************************************* + * Copyright (C) 2006 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * basic_initblock.h -- + * + * VM initialization block. + */ + +#ifndef _BASIC_INITBLOCK_H_ +#define _BASIC_INITBLOCK_H_ + + +#define INCLUDE_ALLOW_USERLEVEL + +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_VMK_MODULE +#define INCLUDE_ALLOW_DISTRIBUTE +#define INCLUDE_ALLOW_VMCORE +#include "includeCheck.h" + + +#include "vcpuid.h" + + +#define MAX_INITBLOCK_CPUS 128 + + +typedef +#include "vmware_pack_begin.h" +struct InitBlock { + uint32 magicNumber; /* Magic number (INIT_BLOCK_MAGIC) */ + Vcpuid numVCPUs; + VA64 crosspage[MAX_INITBLOCK_CPUS]; + uint32 vmInitFailurePeriod; + LA64 crossGDTHKLA; + MPN crossGDTMPNs[5]; // CROSSGDT_NUMPAGES +} +#include "vmware_pack_end.h" +InitBlock; + + +#endif // _BASIC_INITBLOCK_H_ diff --git a/vmmon-only/include/circList.h b/vmmon-only/include/circList.h new file mode 100644 index 00000000..ac4f48f1 --- /dev/null +++ b/vmmon-only/include/circList.h @@ -0,0 +1,428 @@ +/********************************************************* + * Copyright (C) 1998-2015 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * circList.h -- + * + * macros, prototypes and struct definitions for double-linked + * circular lists. 
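+ *
+ * Illustrative usage, assuming a hypothetical Foo type that embeds a
+ * ListItem (neither Foo nor fooList is part of this header):
+ *
+ *    typedef struct Foo { int value; ListItem links; } Foo;
+ *
+ *    LIST_ITEM_DEF(fooList);              // empty list: NULL head
+ *    LIST_QUEUE(&foo->links, &fooList);   // append foo at the back
+ *
+ *    ListItem *li;
+ *    LIST_SCAN(li, fooList) {
+ *       Foo *f = LIST_CONTAINER(li, Foo, links);
+ *       ...
+ *    }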
+ */ + +#ifndef _CIRCLIST_H_ +#define _CIRCLIST_H_ + +#define INCLUDE_ALLOW_USERLEVEL +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_VMKERNEL +#include "includeCheck.h" +#include "vmware.h" + +typedef struct ListItem { + struct ListItem *prev; + struct ListItem *next; +} ListItem; + +/* A list with no elements is a null pointer. */ +#define LIST_ITEM_DEF(name) \ + ListItem * name = NULL + +#define LIST_EMPTY(l) ((l) == NULL) + +/* initialize list item */ +#define INIT_LIST_ITEM(p) \ + do { \ + (p)->prev = (p)->next = (p); \ + } while (0) + +/* check if initialized */ +#define IS_LIST_ITEM_INITIALIZED(li) \ + (((li) == (li)->prev) && ((li) == (li)->next)) + +/* return first element in the list */ +#define LIST_FIRST(l) (l) +#define LIST_FIRST_CHK(l) (l) + +/* return last element in the list */ +#define LIST_LAST(l) ((l)->prev) +#define LIST_LAST_CHK(l) (LIST_EMPTY(l) ? NULL : LIST_LAST(l)) + +/* + * LIST_CONTAINER - get the struct for this entry (like list_entry) + * @ptr: the &struct ListItem pointer. + * @type: the type of the struct this is embedded in. + * @member: the name of the list struct within the struct. + */ +#define LIST_CONTAINER(ptr, type, member) \ + VMW_CONTAINER_OF(ptr, type, member) + +/* + * delete item from the list + */ +#define LIST_DEL DelListItem + +/* + * link two lists together + */ +#define LIST_SPLICE SpliceLists + +/* + * Split a list into two lists + */ +#define LIST_SPLIT SplitLists + +/* + * Add item to front of stack. List pointer points to new head. + */ +#define LIST_PUSH PushListItem + +/* + * Add item at back of queue. List pointer only changes if list was empty. + */ +#define LIST_QUEUE QueueListItem + +/* + * Get the list size. + */ +#define LIST_SIZE GetListSize + +/* + * LIST_SCAN_FROM scans the list from "from" up until "until". + * The loop variable p should not be destroyed in the process. + * "from" is an element in the list where to start scanning. + * "until" is the element where search should stop. + * member is the field to use for the search - either "next" or "prev". + */ +#define LIST_SCAN_FROM(p, from, until, member) \ + for (p = (from); (p) != NULL; \ + (p) = (((p)->member == (until)) ? NULL : (p)->member)) + +/* scan the entire list (non-destructively) */ +#define LIST_SCAN(p, l) \ + LIST_SCAN_FROM(p, LIST_FIRST(l), LIST_FIRST(l), next) + + +/* scan a list backward from last element to first (non-destructively) */ +#define LIST_SCAN_BACK(p, l) \ + LIST_SCAN_FROM(p, LIST_LAST_CHK(l), LIST_LAST(l), prev) + +/* scan the entire list where loop element may be destroyed */ +#define LIST_SCAN_SAFE(p, pn, l) \ + if (!LIST_EMPTY(l)) \ + for (p = (l), (pn) = NextListItem(p, l); (p) != NULL; \ + (p) = (pn), (pn) = NextListItem(p, l)) + +/* scan the entire list backwards where loop element may be destroyed */ +#define LIST_SCAN_BACK_SAFE(p, pn, l) \ + if (!LIST_EMPTY(l)) \ + for (p = LIST_LAST(l), (pn) = PrevListItem(p, l); (p) != NULL; \ + (p) = (pn), (pn) = PrevListItem(p, l)) + + +/* function definitions */ + +/* + *---------------------------------------------------------------------- + * + * NextListItem -- + * + * Returns the next member of a doubly linked list, or NULL if last. + * Assumes: p is member of the list headed by head. + * + * Result: + * If head or p is NULL, return NULL. Otherwise, + * next list member (or null if last). + * + * Side effects: + * None. 
+ * + *---------------------------------------------------------------------- + */ + +static INLINE ListItem * +NextListItem(ListItem *p, // IN + ListItem *head) // IN +{ + if (head == NULL || p == NULL) { + return NULL; + } + /* both p and head are non-null */ + p = p->next; + return p == head ? NULL : p; +} + + +/* + *---------------------------------------------------------------------- + * + * PrevListItem -- + * + * Returns the prev member of a doubly linked list, or NULL if first. + * Assumes: p is member of the list headed by head. + * + * Result: + * If head or prev is NULL, return NULL. Otherwise, + * prev list member (or null if first). + * + * Side effects: + * None. + * + *---------------------------------------------------------------------- + */ + +static INLINE ListItem * +PrevListItem(ListItem *p, // IN + ListItem *head) // IN +{ + if (head == NULL || p == NULL) { + return NULL; + } + /* both p and head are non-null */ + return p == head ? NULL : p->prev; +} + + +/* + *---------------------------------------------------------------------- + * + * DelListItem -- + * + * Deletes a member of a doubly linked list, possibly modifies the + * list header itself. + * Assumes neither p nor headp is null and p is a member of *headp. + * + * Result: + * None + * + * Side effects: + * Modifies *headp. + * + *---------------------------------------------------------------------- + */ + +static INLINE void +DelListItem(ListItem *p, // IN + ListItem **headp) // IN/OUT +{ + ListItem *next; + + ASSERT(p); + ASSERT(headp); + + next = p->next; + if (p == next) { + *headp = NULL; + } else { + next->prev = p->prev; + p->prev->next = next; + if (*headp == p) { + *headp = next; + } + } +} + + +/* + *---------------------------------------------------------------------- + * + * QueueListItem -- + * + * Adds a new member to the back of a doubly linked list (queue) + * Assumes neither p nor headp is null and p is not a member of *headp. + * + * Result: + * None + * + * Side effects: + * Modifies *headp. + * + *---------------------------------------------------------------------- + */ + +static INLINE void +QueueListItem(ListItem *p, // IN + ListItem **headp) // IN/OUT +{ + ListItem *head; + + head = *headp; + if (LIST_EMPTY(head)) { + INIT_LIST_ITEM(p); + *headp = p; + } else { + p->prev = head->prev; + p->next = head; + p->prev->next = p; + head->prev = p; + } +} + + +/* + *---------------------------------------------------------------------- + * + * PushListItem -- + * + * Adds a new member to the front of a doubly linked list (stack) + * Assumes neither p nor headp is null and p is not a member of *headp. + * + * Result: + * None + * + * Side effects: + * Modifies *headp. + * + *---------------------------------------------------------------------- + */ + +static INLINE void +PushListItem(ListItem *p, // IN + ListItem **headp) // IN/OUT +{ + QueueListItem(p, headp); + *headp = p; +} + + +/* + *---------------------------------------------------------------------- + * + * SpliceLists -- + * + * Make a single list {l1 l2} from {l1} and {l2} and return it. + * It is okay for one or both lists to be NULL. + * No checking is done. It is assumed that l1 and l2 are two + * distinct lists. + * + * Result: + * A list { l1 l2 }. + * + * Side effects: + * Modifies l1 and l2 list pointers. 
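+ *
+ * For example (informal): splicing l1 = { a b } and l2 = { c d }
+ * returns the list { a b c d }, whose head is a.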
+ * + *---------------------------------------------------------------------- + */ + +static INLINE ListItem * +SpliceLists(ListItem *l1, // IN + ListItem *l2) // IN +{ + ListItem *l1Last, *l2Last; + + if (LIST_EMPTY(l1)) { + return l2; + } + + if (LIST_EMPTY(l2)) { + return l1; + } + + l1Last = l1->prev; /* last elem of l1 */ + l2Last = l2->prev; /* last elem of l2 */ + + /* + * l1 -> ... -> l1Last l2 -> ... l2Last + */ + l1Last->next = l2; + l2->prev = l1Last; + + l1->prev = l2Last; + l2Last->next = l1; + + return l1; +} + + +/* + *---------------------------------------------------------------------- + * + * SplitLists -- + * + * Make a list l = {l1 l2} into two separate lists {l1} and {l2}, where: + * l = { ... x -> p -> ... } split into: + * l1 = { ... -> x } + * l2 = { p -> ... } + * Assumes neither p nor l is null and p is a member of l. + * If p is the first element of l, then l1 will be NULL. + * + * Result: + * None. + * + * Side effects: + * Sets *l1p and *l2p to the resulting two lists. + * Modifies l's pointers. + * + *---------------------------------------------------------------------- + */ + +static INLINE void +SplitLists(ListItem *p, // IN + ListItem *l, // IN + ListItem **l1p, // OUT + ListItem **l2p) // OUT +{ + ListItem *last; + + if (p == LIST_FIRST(l)) { /* first element */ + *l1p = NULL; + *l2p = l; + return; + } + + last = l->prev; + + *l1p = l; + p->prev->next = l; + l->prev = p->prev; + + *l2p = p; + p->prev = last; + last->next = p; +} + + +/* + *---------------------------------------------------------------------- + * + * GetListSize -- + * + * Return the number of items in the list. + * + * Result: + * The number of items in the list. + * + * Side effects: + * None. + * + *---------------------------------------------------------------------- + */ + +static INLINE int +GetListSize(ListItem *head) // IN +{ + ListItem *li; + int ret = 0; + + LIST_SCAN(li, head) { + ret++; + } + return ret; +} + +#endif /* _CIRCLIST_H_ */ diff --git a/vmmon-only/include/community_source.h b/vmmon-only/include/community_source.h new file mode 100644 index 00000000..2d32d8fa --- /dev/null +++ b/vmmon-only/include/community_source.h @@ -0,0 +1,67 @@ +/********************************************************* + * Copyright (C) 2009-2015 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * community_source.h -- + * + * Macros for excluding source code from community. 
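+ *
+ * Illustrative use (hypothetical statement, not from this tree):
+ * EXCLUDE_COMMUNITY_SOURCE(InternalDebugHook();) compiles the call
+ * away when COMMUNITY_SOURCE is defined and expands to it unchanged
+ * otherwise.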
+ */ + +#ifndef _COMMUNITY_SOURCE_H_ +#define _COMMUNITY_SOURCE_H_ + +#define INCLUDE_ALLOW_USERLEVEL + +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_VMKDRIVERS +#define INCLUDE_ALLOW_VMK_MODULE +#define INCLUDE_ALLOW_DISTRIBUTE +#define INCLUDE_ALLOW_VMCORE +#include "includeCheck.h" + +/* + * Convenience macro for COMMUNITY_SOURCE + */ +#undef EXCLUDE_COMMUNITY_SOURCE +#ifdef COMMUNITY_SOURCE + #define EXCLUDE_COMMUNITY_SOURCE(x) +#else + #define EXCLUDE_COMMUNITY_SOURCE(x) x +#endif + +#undef COMMUNITY_SOURCE_AMD_SECRET +#if !defined(COMMUNITY_SOURCE) || defined(AMD_SOURCE) +/* + * It's ok to include AMD_SECRET source code for non-Community Source, + * or for drops directed at AMD. + */ + #define COMMUNITY_SOURCE_AMD_SECRET +#endif + +#undef COMMUNITY_SOURCE_INTEL_SECRET +#if !defined(COMMUNITY_SOURCE) || defined(INTEL_SOURCE) +/* + * It's ok to include INTEL_SECRET source code for non-Community Source, + * or for drops directed at Intel. + */ + #define COMMUNITY_SOURCE_INTEL_SECRET +#endif + +#endif diff --git a/vmmon-only/include/compat_autoconf.h b/vmmon-only/include/compat_autoconf.h new file mode 100644 index 00000000..26064aa8 --- /dev/null +++ b/vmmon-only/include/compat_autoconf.h @@ -0,0 +1,41 @@ +/********************************************************* + * Copyright (C) 2009 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef __COMPAT_AUTOCONF_H__ +# define __COMPAT_AUTOCONF_H__ + +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_DISTRIBUTE +#define INCLUDE_ALLOW_VMKDRIVERS +#include "includeCheck.h" + + +#ifndef LINUX_VERSION_CODE +# error "Include compat_version.h before compat_autoconf.h" +#endif + +/* autoconf.h moved from linux/autoconf.h to generated/autoconf.h in 2.6.33-rc1. */ +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 33) +# include +#else +# include +#endif + +#endif /* __COMPAT_AUTOCONF_H__ */ diff --git a/vmmon-only/include/compat_cred.h b/vmmon-only/include/compat_cred.h new file mode 100644 index 00000000..95a7baa7 --- /dev/null +++ b/vmmon-only/include/compat_cred.h @@ -0,0 +1,47 @@ +/********************************************************* + * Copyright (C) 2002 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. 
+ * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef __COMPAT_CRED_H__ +# define __COMPAT_CRED_H__ + + +/* + * Include linux/cred.h via linux/sched.h - it is not nice, but + * as cpp does not have #ifexist... + */ +#include + +#if !defined(current_fsuid) && LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 29) +#define current_uid() (current->uid) +#define current_euid() (current->euid) +#define current_fsuid() (current->fsuid) +#define current_gid() (current->gid) +#define current_egid() (current->egid) +#define current_fsgid() (current->fsgid) +#endif + +#if !defined(cap_set_full) +/* cap_set_full was removed in kernel version 3.0-rc4. */ +#define cap_set_full(_c) do { (_c) = CAP_FULL_SET; } while (0) +#endif + +#if !defined(GLOBAL_ROOT_UID) +#define GLOBAL_ROOT_UID (0) +#endif + +#endif /* __COMPAT_CRED_H__ */ diff --git a/vmmon-only/include/compat_highmem.h b/vmmon-only/include/compat_highmem.h new file mode 100644 index 00000000..263380d6 --- /dev/null +++ b/vmmon-only/include/compat_highmem.h @@ -0,0 +1,32 @@ +/********************************************************* + * Copyright (C) 2012 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef __COMPAT_HIGHMEM_H__ +# define __COMPAT_HIGHMEM_H__ + +#include + +#if LINUX_VERSION_CODE >= KERNEL_VERSION(3, 5, 0) +# define compat_kmap_atomic(_page) kmap_atomic(_page) +# define compat_kunmap_atomic(_page) kunmap_atomic(_page) +#else +# define compat_kmap_atomic(_page) kmap_atomic((_page), KM_USER0) +# define compat_kunmap_atomic(_page) kunmap_atomic((_page), KM_USER0) +#endif + +#endif /* __COMPAT_HIGHMEM_H__ */ diff --git a/vmmon-only/include/compat_interrupt.h b/vmmon-only/include/compat_interrupt.h new file mode 100644 index 00000000..1d72a4bb --- /dev/null +++ b/vmmon-only/include/compat_interrupt.h @@ -0,0 +1,55 @@ +/********************************************************* + * Copyright (C) 2003 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. 
+ * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef __COMPAT_INTERRUPT_H__ +# define __COMPAT_INTERRUPT_H__ + + +#include + +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 5, 69) +/* + * We cannot just define irqreturn_t, as some 2.4.x kernels have + * typedef void irqreturn_t; for "increasing" backward compatibility. + */ +typedef void compat_irqreturn_t; +#define COMPAT_IRQ_NONE +#define COMPAT_IRQ_HANDLED +#define COMPAT_IRQ_RETVAL(x) +#else +typedef irqreturn_t compat_irqreturn_t; +#define COMPAT_IRQ_NONE IRQ_NONE +#define COMPAT_IRQ_HANDLED IRQ_HANDLED +#define COMPAT_IRQ_RETVAL(x) IRQ_RETVAL(x) +#endif + +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 18) +#define COMPAT_IRQF_DISABLED SA_INTERRUPT +#define COMPAT_IRQF_SHARED SA_SHIRQ +#else +#define COMPAT_IRQF_DISABLED IRQF_DISABLED +#define COMPAT_IRQF_SHARED IRQF_SHARED +#endif + +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 20) +#define COMPAT_IRQ_HANDLER_ARGS(irq, devp) (int irq, void *devp, struct pt_regs *regs) +#else +#define COMPAT_IRQ_HANDLER_ARGS(irq, devp) (int irq, void *devp) +#endif + +#endif /* __COMPAT_INTERRUPT_H__ */ diff --git a/vmmon-only/include/compat_ioport.h b/vmmon-only/include/compat_ioport.h new file mode 100644 index 00000000..bacdb50b --- /dev/null +++ b/vmmon-only/include/compat_ioport.h @@ -0,0 +1,63 @@ +/********************************************************* + * Copyright (C) 2003 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. 
+ * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef __COMPAT_IOPORT_H__ +# define __COMPAT_IOPORT_H__ + + +#include + +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 4, 0) +static inline void * +compat_request_region(unsigned long start, unsigned long len, const char *name) +{ + if (check_region(start, len)) { + return NULL; + } + request_region(start, len, name); + return (void*)1; +} +#else +#define compat_request_region(start, len, name) request_region(start, len, name) +#endif + +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 3, 7) +/* mmap io support starts from 2.3.7, fail the call for kernel prior to that */ +static inline void * +compat_request_mem_region(unsigned long start, unsigned long len, const char *name) +{ + return NULL; +} + +static inline void +compat_release_mem_region(unsigned long start, unsigned long len) +{ + return; +} +#else +#define compat_request_mem_region(start, len, name) request_mem_region(start, len, name) +#define compat_release_mem_region(start, len) release_mem_region(start, len) +#endif + +/* these two macro defs are needed by compat_pci_request_region */ +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 3, 15) +# define IORESOURCE_IO 0x00000100 +# define IORESOURCE_MEM 0x00000200 +#endif + +#endif /* __COMPAT_IOPORT_H__ */ diff --git a/vmmon-only/include/compat_kernel.h b/vmmon-only/include/compat_kernel.h new file mode 100644 index 00000000..04ba2d19 --- /dev/null +++ b/vmmon-only/include/compat_kernel.h @@ -0,0 +1,42 @@ +/********************************************************* + * Copyright (C) 2004 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef __COMPAT_KERNEL_H__ +# define __COMPAT_KERNEL_H__ + +#include +#include + +/* + * container_of was introduced in 2.5.28 but it's easier to check like this. + */ +#ifndef container_of +#define container_of(ptr, type, member) ({ \ + const typeof( ((type *)0)->member ) *__mptr = (ptr); \ + (type *)( (char *)__mptr - offsetof(type,member) );}) +#endif + +/* + * vsnprintf became available in 2.4.10. For older kernels, just fall back on + * vsprintf. + */ +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 4, 10) +#define vsnprintf(str, size, fmt, args) vsprintf(str, fmt, args) +#endif + +#endif /* __COMPAT_KERNEL_H__ */ diff --git a/vmmon-only/include/compat_module.h b/vmmon-only/include/compat_module.h new file mode 100644 index 00000000..2af73722 --- /dev/null +++ b/vmmon-only/include/compat_module.h @@ -0,0 +1,83 @@ +/********************************************************* + * Copyright (C) 2007 VMware, Inc. All rights reserved. 
+ * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * compat_module.h -- + */ + +#ifndef __COMPAT_MODULE_H__ +# define __COMPAT_MODULE_H__ + + +#include + + +/* + * Modules wishing to use the GPL license are required to include a + * MODULE_LICENSE definition in their module source as of 2.4.10. + */ +#ifndef MODULE_LICENSE +#define MODULE_LICENSE(license) +#endif + +/* + * To make use of our own home-brewed MODULE_INFO, we need macros to + * concatenate two expressions to "__mod_", and and to convert an + * expression into a string. I'm sure we've got these in our codebase, + * but I'd rather not introduce such a dependency in a compat header. + */ +#ifndef __module_cat +#define __module_cat_1(a, b) __mod_ ## a ## b +#define __module_cat(a, b) __module_cat_1(a, b) +#endif + +#ifndef __stringify +#define __stringify_1(x) #x +#define __stringify(x) __stringify_1(x) +#endif + +/* + * MODULE_INFO was born in 2.5.69. + */ +#ifndef MODULE_INFO +#define MODULE_INFO(tag, info) \ +static const char __module_cat(tag, __LINE__)[] \ + __attribute__((section(".modinfo"), unused)) = __stringify(tag) "=" info +#endif + +/* + * MODULE_VERSION was born in 2.6.4. The earlier form appends a long "\0xxx" + * string to the module's version, but that was removed in 2.6.10, so we'll + * ignore it in our wrapper. + */ +#ifndef MODULE_VERSION +#define MODULE_VERSION(_version) MODULE_INFO(version, _version) +#endif + +/* + * Linux kernel < 2.6.31 takes 'int' for 'bool' module parameters. + * Linux kernel >= 3.3.0 takes 'bool' for 'bool' module parameters. + * Kernels between the two take either. So flip switch at 3.0.0. + */ +#if LINUX_VERSION_CODE >= KERNEL_VERSION(3, 0, 0) + typedef bool compat_mod_param_bool; +#else + typedef int compat_mod_param_bool; +#endif + +#endif /* __COMPAT_MODULE_H__ */ diff --git a/vmmon-only/include/compat_page.h b/vmmon-only/include/compat_page.h new file mode 100644 index 00000000..0bf0e251 --- /dev/null +++ b/vmmon-only/include/compat_page.h @@ -0,0 +1,75 @@ +/********************************************************* + * Copyright (C) 2002 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. 
+ * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef __COMPAT_PAGE_H__ +# define __COMPAT_PAGE_H__ + + +#include +#include + + +/* The pfn_to_page() API appeared in 2.5.14 and changed to function during 2.6.x */ +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 0) && !defined(pfn_to_page) +# define pfn_to_page(_pfn) (mem_map + (_pfn)) +# define page_to_pfn(_page) ((_page) - mem_map) +#endif + + +/* The virt_to_page() API appeared in 2.4.0 --hpreg */ +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 4, 0) && !defined(virt_to_page) +# define virt_to_page(_kvAddr) pfn_to_page(MAP_NR(_kvAddr)) +#endif + + +/* + * The get_order() API appeared at some point in 2.3.x, and was then backported + * in 2.2.17-21mdk and in the stock 2.2.18. Because we can only detect its + * definition through makefile tricks, we provide our own for now --hpreg + */ +static inline int +compat_get_order(unsigned long size) // IN +{ + int order; + + size = (size - 1) >> (PAGE_SHIFT - 1); + order = -1; + do { + size >>= 1; + order++; + } while (size); + + return order; +} + +/* + * BUG() was added to in 2.2.18, and was moved to + * in 2.5.58. + * + * XXX: Technically, this belongs in some sort of "compat_asm_page.h" file, but + * since our compatibility wrappers don't distinguish between and + * , putting it here is reasonable. + */ +#ifndef BUG +#define BUG() do { \ + printk("kernel BUG at %s:%d!\n", __FILE__, __LINE__); \ + __asm__ __volatile__(".byte 0x0f,0x0b"); \ +} while (0) +#endif + +#endif /* __COMPAT_PAGE_H__ */ diff --git a/vmmon-only/include/compat_pci.h b/vmmon-only/include/compat_pci.h new file mode 100644 index 00000000..d1f897a7 --- /dev/null +++ b/vmmon-only/include/compat_pci.h @@ -0,0 +1,72 @@ +/********************************************************* + * Copyright (C) 1999 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * compat_pci.h: PCI compatibility wrappers. + */ + +#ifndef __COMPAT_PCI_H__ +#define __COMPAT_PCI_H__ + +#include "compat_ioport.h" +#include + +#ifndef DMA_BIT_MASK +# define DMA_BIT_MASK(n) DMA_##n##BIT_MASK +#endif + +/* + * Power Management related compat wrappers. 
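+ *
+ * Illustrative use in a hypothetical legacy suspend handler:
+ *
+ *    compat_pci_save_state(pdev);
+ *    pci_disable_device(pdev);
+ *    pci_set_power_state(pdev, compat_pci_choose_state(pdev, state));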
+ */ +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 10) +# define compat_pci_save_state(pdev) pci_save_state((pdev), NULL) +# define compat_pci_restore_state(pdev) pci_restore_state((pdev), NULL) +#else +# define compat_pci_save_state(pdev) pci_save_state((pdev)) +# define compat_pci_restore_state(pdev) pci_restore_state((pdev)) +#endif + +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 11) +# define pm_message_t u32 +# define compat_pci_choose_state(pdev, state) (state) +# define PCI_D0 0 +# define PCI_D3hot 3 +#else +# define compat_pci_choose_state(pdev, state) pci_choose_state((pdev), (state)) +#endif + +/* 2.6.14 changed the PCI shutdown callback */ +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 14) +# define COMPAT_PCI_SHUTDOWN(func) .driver = { .shutdown = (func), } +# define COMPAT_PCI_DECLARE_SHUTDOWN(func, var) (func)(struct device *(var)) +# define COMPAT_PCI_TO_DEV(dev) (to_pci_dev(dev)) +#else +# define COMPAT_PCI_SHUTDOWN(func) .shutdown = (func) +# define COMPAT_PCI_DECLARE_SHUTDOWN(func, var) (func)(struct pci_dev *(var)) +# define COMPAT_PCI_TO_DEV(dev) (dev) +#endif + +/* 2.6.26 introduced the device_set_wakeup_enable() function */ +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 26) +# define compat_device_set_wakeup_enable(dev, val) do {} while(0) +#else +# define compat_device_set_wakeup_enable(dev, val) \ + device_set_wakeup_enable(dev, val) +#endif + +#endif /* __COMPAT_PCI_H__ */ diff --git a/vmmon-only/include/compat_pgtable.h b/vmmon-only/include/compat_pgtable.h new file mode 100644 index 00000000..dedc25ad --- /dev/null +++ b/vmmon-only/include/compat_pgtable.h @@ -0,0 +1,139 @@ +/********************************************************* + * Copyright (C) 2002 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. 
+ * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef __COMPAT_PGTABLE_H__ +# define __COMPAT_PGTABLE_H__ + + +#if defined(CONFIG_PARAVIRT) && defined(CONFIG_HIGHPTE) +# if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 21) +# include +# undef paravirt_map_pt_hook +# define paravirt_map_pt_hook(type, va, pfn) do {} while (0) +# endif +#endif +#include + + +/* pte_page() API modified in 2.3.23 to return a struct page * --hpreg */ +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 3, 23) +# define compat_pte_page pte_page +#else +# include "compat_page.h" + +# define compat_pte_page(_pte) virt_to_page(pte_page(_pte)) +#endif + + +/* Appeared in 2.5.5 --hpreg */ +#ifndef pte_offset_map +/* Appeared in SuSE 8.0's 2.4.18 --hpreg */ +# ifdef pte_offset_atomic +# define pte_offset_map pte_offset_atomic +# define pte_unmap pte_kunmap +# else +# define pte_offset_map pte_offset +# define pte_unmap(_pte) +# endif +#endif + + +/* Appeared in 2.5.74-mmX --petr */ +#ifndef pmd_offset_map +# define pmd_offset_map(pgd, address) pmd_offset(pgd, address) +# define pmd_unmap(pmd) +#endif + + +/* + * Appeared in 2.6.10-rc2-mm1. Older kernels did L4 page tables as + * part of pgd_offset, or they did not have L4 page tables at all. + * In 2.6.11 pml4 -> pgd -> pmd -> pte hierarchy was replaced by + * pgd -> pud -> pmd -> pte hierarchy. + */ +#ifdef PUD_MASK +# define compat_pgd_offset(mm, address) pgd_offset(mm, address) +# define compat_pgd_present(pgd) pgd_present(pgd) +# define compat_pud_offset(pgd, address) pud_offset(pgd, address) +# define compat_pud_present(pud) pud_present(pud) +typedef pgd_t compat_pgd_t; +typedef pud_t compat_pud_t; +#elif defined(pml4_offset) +# define compat_pgd_offset(mm, address) pml4_offset(mm, address) +# define compat_pgd_present(pml4) pml4_present(pml4) +# define compat_pud_offset(pml4, address) pml4_pgd_offset(pml4, address) +# define compat_pud_present(pgd) pgd_present(pgd) +typedef pml4_t compat_pgd_t; +typedef pgd_t compat_pud_t; +#else +# define compat_pgd_offset(mm, address) pgd_offset(mm, address) +# define compat_pgd_present(pgd) pgd_present(pgd) +# define compat_pud_offset(pgd, address) (pgd) +# define compat_pud_present(pud) (1) +typedef pgd_t compat_pgd_t; +typedef pgd_t compat_pud_t; +#endif + + +#define compat_pgd_offset_k(mm, address) pgd_offset_k(address) + + +/* Introduced somewhere in 2.6.0, + backported to some 2.4 RedHat kernels */ +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 0) && !defined(pte_pfn) +# define pte_pfn(pte) page_to_pfn(compat_pte_page(pte)) +#endif + + +/* A page_table_lock field is added to struct mm_struct in 2.3.10 --hpreg */ +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 3, 10) +# define compat_get_page_table_lock(_mm) (&(_mm)->page_table_lock) +#else +# define compat_get_page_table_lock(_mm) NULL +#endif + + +/* + * Define VM_PAGE_KERNEL_EXEC for vmapping executable pages. + * + * On ia32 PAGE_KERNEL_EXEC was introduced in 2.6.8.1. Unfortunately it accesses + * __PAGE_KERNEL_EXEC which is not exported for modules. So we use + * __PAGE_KERNEL and just cut _PAGE_NX bit from it. + * + * For ia32 kernels before 2.6.8.1 we use PAGE_KERNEL directly, these kernels + * do not have noexec support. 
+ * + * On x86-64 situation is a bit better: they always supported noexec, but + * before 2.6.8.1 flag was named PAGE_KERNEL_EXECUTABLE, and it was renamed + * to PAGE_KERNEL_EXEC when ia32 got noexec too (see above). + */ +#ifdef CONFIG_X86 +#ifdef _PAGE_NX +#define VM_PAGE_KERNEL_EXEC __pgprot(__PAGE_KERNEL & ~_PAGE_NX) +#else +#define VM_PAGE_KERNEL_EXEC PAGE_KERNEL +#endif +#else +#ifdef PAGE_KERNEL_EXECUTABLE +#define VM_PAGE_KERNEL_EXEC PAGE_KERNEL_EXECUTABLE +#else +#define VM_PAGE_KERNEL_EXEC PAGE_KERNEL_EXEC +#endif +#endif + + +#endif /* __COMPAT_PGTABLE_H__ */ diff --git a/vmmon-only/include/compat_sched.h b/vmmon-only/include/compat_sched.h new file mode 100644 index 00000000..3f3304bd --- /dev/null +++ b/vmmon-only/include/compat_sched.h @@ -0,0 +1,293 @@ +/********************************************************* + * Copyright (C) 2002 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef __COMPAT_SCHED_H__ +# define __COMPAT_SCHED_H__ + + +#include + +/* CLONE_KERNEL available in 2.5.35 and higher. */ +#ifndef CLONE_KERNEL +#define CLONE_KERNEL CLONE_FILES | CLONE_FS | CLONE_SIGHAND +#endif + +/* TASK_COMM_LEN become available in 2.6.11. */ +#ifndef TASK_COMM_LEN +#define TASK_COMM_LEN 16 +#endif + +/* The capable() API appeared in 2.1.92 --hpreg */ +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 1, 92) +# define capable(_capability) suser() +#endif + +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 2, 0) +# define need_resched() need_resched +#elif LINUX_VERSION_CODE < KERNEL_VERSION(2, 5, 3) +# define need_resched() (current->need_resched) +#endif + +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 5, 3) +# define cond_resched() (need_resched() ? schedule() : (void) 0) +#endif + +/* Oh well. We need yield... Happy us! */ +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 4, 20) +# ifdef __x86_64__ +# define compat_yield() there_is_nothing_like_yield() +# else +# include +# include + +/* + * Used by _syscallX macros. Note that this is global variable, so + * do not rely on its contents too much. As exit() is only function + * we use, and we never check return value from exit(), we have + * no problem... + */ +extern int errno; + +/* + * compat_exit() provides an access to the exit() function. It must + * be named compat_exit(), as exit() (with different signature) is + * provided by x86-64, arm and other (but not by i386). + */ +# define __NR_compat_yield __NR_sched_yield +static inline _syscall0(int, compat_yield); +# endif +#else +# define compat_yield() yield() +#endif + + +/* + * Since 2.5.34 there are two methods to enumerate tasks: + * for_each_process(p) { ... } which enumerates only tasks and + * do_each_thread(g,t) { ... } while_each_thread(g,t) which enumerates + * also threads even if they share same pid. 
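+ *
+ * Typical traversal (sketch; callers also need the usual tasklist
+ * locking or RCU protection):
+ *
+ *    struct task_struct *g, *t;
+ *    do_each_thread(g, t) {
+ *       ...
+ *    } while_each_thread(g, t);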
+ */ +#ifndef for_each_process +# define for_each_process(p) for_each_task(p) +#endif + +#ifndef do_each_thread +# define do_each_thread(g, t) for_each_task(g) { t = g; do +# define while_each_thread(g, t) while (0) } +#endif + + +/* + * Lock for signal mask is moving target... + */ +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 5, 40) && defined(CLONE_PID) +/* 2.4.x without NPTL patches or early 2.5.x */ +#define compat_sigmask_lock sigmask_lock +#define compat_dequeue_signal_current(siginfo_ptr) \ + dequeue_signal(&current->blocked, (siginfo_ptr)) +#elif LINUX_VERSION_CODE < KERNEL_VERSION(2, 5, 60) && !defined(INIT_SIGHAND) +/* RedHat's 2.4.x with first version of NPTL support, or 2.5.40 to 2.5.59 */ +#define compat_sigmask_lock sig->siglock +#define compat_dequeue_signal_current(siginfo_ptr) \ + dequeue_signal(&current->blocked, (siginfo_ptr)) +#else +/* RedHat's 2.4.x with second version of NPTL support, or 2.5.60+. */ +#define compat_sigmask_lock sighand->siglock +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 5, 0) +#define compat_dequeue_signal_current(siginfo_ptr) \ + dequeue_signal(&current->blocked, (siginfo_ptr)) +#else +#define compat_dequeue_signal_current(siginfo_ptr) \ + dequeue_signal(current, &current->blocked, (siginfo_ptr)) +#endif +#endif + +/* + * recalc_sigpending() had task argument in the past + */ +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 5, 29) && defined(CLONE_PID) +/* 2.4.x without NPTL patches or early 2.5.x */ +#define compat_recalc_sigpending() recalc_sigpending(current) +#else +/* RedHat's 2.4.x with NPTL support, or 2.5.29+ */ +#define compat_recalc_sigpending() recalc_sigpending() +#endif + + +/* + * reparent_to_init() was introduced in 2.4.8. In 2.5.38 (or possibly + * earlier, but later than 2.5.31) a call to it was added into + * daemonize(), so compat_daemonize no longer needs to call it. + * + * In 2.4.x kernels reparent_to_init() forgets to do correct refcounting + * on current->user. It is better to count one too many than one too few... + */ +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 4, 8) && LINUX_VERSION_CODE < KERNEL_VERSION(2, 5, 38) +#define compat_reparent_to_init() do { \ + reparent_to_init(); \ + atomic_inc(&current->user->__count); \ + } while (0) +#else +#define compat_reparent_to_init() do {} while (0) +#endif + + +/* + * daemonize appeared in 2.2.18. Except 2.2.17-4-RH7.0, which has it too. + * Fortunately 2.2.17-4-RH7.0 uses versioned symbols, so we can check + * its existence with defined(). + */ +#if (LINUX_VERSION_CODE < KERNEL_VERSION(2, 2, 18)) && !defined(daemonize) +static inline void daemonize(void) { + struct fs_struct *fs; + + exit_mm(current); + current->session = 1; + current->pgrp = 1; + exit_fs(current); + fs = init_task.fs; + current->fs = fs; + atomic_inc(&fs->count); +} +#endif + + +/* + * flush_signals acquires sighand->siglock since 2.5.61... Verify RH's kernels! + */ +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 5, 61) +#define compat_flush_signals(task) do { \ + spin_lock_irq(&task->compat_sigmask_lock); \ + flush_signals(task); \ + spin_unlock_irq(&task->compat_sigmask_lock); \ + } while (0) +#else +#define compat_flush_signals(task) flush_signals(task) +#endif + +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 5, 61) +#define compat_allow_signal(signr) do { \ + spin_lock_irq(&current->compat_sigmask_lock); \ + sigdelset(&current->blocked, signr); \ + compat_recalc_sigpending(); \ + spin_unlock_irq(&current->compat_sigmask_lock); \ + } while (0) +#else +#define compat_allow_signal(signr) allow_signal(signr) +#endif + +/* + * daemonize can set process name since 2.5.61.
Prior to 2.5.61, daemonize + * didn't block signals on our behalf. + */ +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 5, 61) +#define compat_daemonize(x...) \ +({ \ + /* Beware! No snprintf here, so verify arguments! */ \ + sprintf(current->comm, x); \ + \ + /* Block all signals. */ \ + spin_lock_irq(&current->compat_sigmask_lock); \ + sigfillset(&current->blocked); \ + compat_recalc_sigpending(); \ + spin_unlock_irq(&current->compat_sigmask_lock); \ + compat_flush_signals(current); \ + \ + daemonize(); \ + compat_reparent_to_init(); \ +}) +#else +#define compat_daemonize(x...) daemonize(x) +#endif + + +/* + * try to freeze a process. For kernels 2.6.11 or newer, we know how to choose + * the interface. The problem is that the oldest interface, introduced in + * 2.5.18, was backported to 2.4.x kernels. So if we're older than 2.6.11, + * we'll decide what to do based on whether or not swsusp was configured + * for the kernel. For kernels 2.6.20 and newer, we'll also need to include + * freezer.h since the try_to_freeze definition was pulled out of sched.h. + */ +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 20) +#include <linux/freezer.h> +#endif +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 13) || defined(VMW_TL10S64_WORKAROUND) +#define compat_try_to_freeze() try_to_freeze() +#elif LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 11) +#define compat_try_to_freeze() try_to_freeze(PF_FREEZE) +#elif defined(CONFIG_SOFTWARE_SUSPEND) || defined(CONFIG_SOFTWARE_SUSPEND2) +#include "compat_mm.h" +#include <linux/errno.h> +#include <linux/suspend.h> +static inline int compat_try_to_freeze(void) { + if (current->flags & PF_FREEZE) { + refrigerator(PF_FREEZE); + return 1; + } else { + return 0; + } +} +#else +static inline int compat_try_to_freeze(void) { return 0; } +#endif + +/* + * As of 2.6.23-rc1, kernel threads are no longer freezable by + * default. Instead, kernel threads that need to be frozen must opt-in + * by calling set_freezable() as soon as the thread is created. + */ + +#if LINUX_VERSION_CODE > KERNEL_VERSION(2, 6, 22) +#define compat_set_freezable() do { set_freezable(); } while (0) +#else +#define compat_set_freezable() do {} while (0) +#endif + +/* + * Around 2.6.27 kernel stopped sending signals to kernel + * threads being frozen, instead threads have to check + * freezing() or use wait_event_freezable(). Unfortunately + * wait_event_freezable() completely hides the fact that + * thread was frozen from calling code and sometimes we do + * want to know that. + */ +#ifdef PF_FREEZER_NOSIG +#define compat_wait_check_freezing() freezing(current) +#else +#define compat_wait_check_freezing() (0) +#endif + +/* + * Since 2.6.27-rc2 kill_proc() is gone... Replacement (GPL-only!) + * API is available since 2.6.19. Use them from 2.6.27-rc1 up. + */ +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 27) +typedef int compat_pid; +#define compat_find_get_pid(pid) (pid) +#define compat_put_pid(pid) do { } while (0) +#define compat_kill_pid(pid, sig, flag) kill_proc(pid, sig, flag) +#else +typedef struct pid * compat_pid; +#define compat_find_get_pid(pid) find_get_pid(pid) +#define compat_put_pid(pid) put_pid(pid) +#define compat_kill_pid(pid, sig, flag) kill_pid(pid, sig, flag) +#endif + + +#endif /* __COMPAT_SCHED_H__ */ diff --git a/vmmon-only/include/compat_semaphore.h b/vmmon-only/include/compat_semaphore.h new file mode 100644 index 00000000..f5527b9c --- /dev/null +++ b/vmmon-only/include/compat_semaphore.h @@ -0,0 +1,49 @@ +/********************************************************* + * Copyright (C) 2002 VMware, Inc. All rights reserved.
+ * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef __COMPAT_SEMAPHORE_H__ +# define __COMPAT_SEMAPHORE_H__ + + +/* <= 2.6.25 have asm only, 2.6.26 has both, and 2.6.27-rc2+ has linux only. */ +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 27) +# include <asm/semaphore.h> +#else +# include <linux/semaphore.h> +#endif + + +/* +* The init_MUTEX_LOCKED() API appeared in 2.2.18, and is also in +* 2.2.17-21mdk --hpreg +*/ + +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 2, 18) + #ifndef init_MUTEX_LOCKED + #define init_MUTEX_LOCKED(_sem) *(_sem) = MUTEX_LOCKED + #endif + #ifndef DECLARE_MUTEX + #define DECLARE_MUTEX(name) struct semaphore name = MUTEX + #endif + #ifndef DECLARE_MUTEX_LOCKED + #define DECLARE_MUTEX_LOCKED(name) struct semaphore name = MUTEX_LOCKED + #endif +#endif + + +#endif /* __COMPAT_SEMAPHORE_H__ */ diff --git a/vmmon-only/include/compat_spinlock.h b/vmmon-only/include/compat_spinlock.h new file mode 100644 index 00000000..b8987a5a --- /dev/null +++ b/vmmon-only/include/compat_spinlock.h @@ -0,0 +1,48 @@ +/********************************************************* + * Copyright (C) 2005 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef __COMPAT_SPINLOCK_H__ +# define __COMPAT_SPINLOCK_H__ + +#include <linux/spinlock.h> + +/* + * Preempt support was added during 2.5.x development cycle, and later + * it was backported to 2.4.x. In 2.4.x backport these definitions + * live in linux/spinlock.h, that's why we put them here (in 2.6.x they + * are defined in linux/preempt.h which is included by linux/spinlock.h).
+ */ +#ifdef CONFIG_PREEMPT +#define compat_preempt_disable() preempt_disable() +#define compat_preempt_enable() preempt_enable() +#else +#define compat_preempt_disable() do { } while (0) +#define compat_preempt_enable() do { } while (0) +#endif + +/* Some older kernels - 2.6.10 and earlier - lack DEFINE_SPINLOCK */ +#ifndef DEFINE_SPINLOCK +#define DEFINE_SPINLOCK(x) spinlock_t x = SPIN_LOCK_UNLOCKED +#endif + +/* Same goes for DEFINE_RWLOCK */ +#ifndef DEFINE_RWLOCK +#define DEFINE_RWLOCK(x) rwlock_t x = RW_LOCK_UNLOCKED +#endif + +#endif /* __COMPAT_SPINLOCK_H__ */ diff --git a/vmmon-only/include/compat_version.h b/vmmon-only/include/compat_version.h new file mode 100644 index 00000000..56d021cf --- /dev/null +++ b/vmmon-only/include/compat_version.h @@ -0,0 +1,131 @@ +/********************************************************* + * Copyright (C) 1998 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef __COMPAT_VERSION_H__ +# define __COMPAT_VERSION_H__ + +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_DISTRIBUTE +#define INCLUDE_ALLOW_VMKDRIVERS +#include "includeCheck.h" + + +#ifndef __linux__ +# error "linux-version.h" +#endif + + +#include <linux/version.h> + +#ifndef KERNEL_VERSION +# error KERNEL_VERSION macro is not defined, environment is busted +#endif + + +/* + * Distinguish relevant classes of Linux kernels. + * + * The convention is that version X defines all + * the KERNEL_Y symbols where Y <= X. + * + * XXX Do not add more definitions here.
This way of doing things does not + * scale, and we are going to phase it out soon --hpreg + */ + +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 1, 0) +# define KERNEL_2_1 +#endif + +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 2, 0) +# define KERNEL_2_2 +#endif + +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 3, 1) +# define KERNEL_2_3_1 +#endif + +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 3, 15) +/* new networking */ +# define KERNEL_2_3_15 +#endif + +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 3, 25) +/* new procfs */ +# define KERNEL_2_3_25 +#endif + +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 3, 29) +/* even newer procfs */ +# define KERNEL_2_3_29 +#endif + +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 3, 43) +/* softnet changes */ +# define KERNEL_2_3_43 +#endif + +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 3, 47) +/* more softnet changes */ +# define KERNEL_2_3_47 +#endif + +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 3, 99) +/* name in netdevice struct is array and not pointer */ +# define KERNEL_2_3_99 +#endif + +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 4, 0) +/* New 'owner' member at the beginning of struct file_operations */ +# define KERNEL_2_4_0 +#endif + +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 4, 8) +/* New netif_rx_ni() --hpreg */ +# define KERNEL_2_4_8 +#endif + +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 5, 2) +/* New kdev_t, major()/minor() API --hpreg */ +# define KERNEL_2_5_2 +#endif + +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 5, 5) +/* New sk_alloc(), pte_offset_map()/pte_unmap() --hpreg */ +# define KERNEL_2_5_5 +#endif + +/* Linux kernel 3.0 can be called 2.6.40, and 3.1 can be 2.6.41... + * Use COMPAT_LINUX_VERSION_CHECK_LT iff you need to compare running kernel to + * versions 3.0 and above. + * + */ +#if LINUX_VERSION_CODE >= KERNEL_VERSION(3, 0, 0) + /* Straight forward comparison if kernel version is 3.0.0 and beyond */ +# define COMPAT_LINUX_VERSION_CHECK_LT(a, b, c) LINUX_VERSION_CODE < KERNEL_VERSION (a, b, c) +#elif LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 40) + /* Use b of the check to calculate corresponding c of kernel + * version to compare */ +# define COMPAT_LINUX_VERSION_CHECK_LT(a, b, c) LINUX_VERSION_CODE < KERNEL_VERSION (2, 6, (b + 40)) +#else + /* This is anyways lesser than any 3.x versions */ +# define COMPAT_LINUX_VERSION_CHECK_LT(a, b, c) 1 +#endif + +#endif /* __COMPAT_VERSION_H__ */ diff --git a/vmmon-only/include/contextinfo.h b/vmmon-only/include/contextinfo.h new file mode 100644 index 00000000..0e6dcbb2 --- /dev/null +++ b/vmmon-only/include/contextinfo.h @@ -0,0 +1,78 @@ +/********************************************************* + * Copyright (C) 2005-2014 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. 
+ * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + + +/* + * contextinfo.h + * + * Context structures shared across all products + */ + +#ifndef _CONTEXTINFO_H +#define _CONTEXTINFO_H + +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_VMMON +#include "includeCheck.h" + +#include "x86desc.h" + +#pragma pack(push, 1) +typedef struct Context64 { + uint64 cr3; + uint64 rax; + uint64 rcx; + uint64 rdx; + uint64 rbx; + uint64 rsi; + uint64 rdi; + uint64 rbp; + uint64 rsp; + uint64 r8; + uint64 r9; + uint64 r10; + uint64 r11; + uint64 r12; + uint64 r13; + uint64 r14; + uint64 r15; + uint32 cs; + uint32 ds; + uint32 ss; + uint32 es; + uint32 fs; + uint32 gs; + uint64 rip; + uint64 eflags; + uint16 ldt; + uint16 _pad[3]; +} Context64; +#pragma pack(pop) + +#pragma pack(push, 1) +typedef struct ContextInfo64 { + DTRWords64 gdtr; + DTRWords64 idtr; + Context64 context; + uint16 tr; + uint16 _pad0; +} ContextInfo64; +#pragma pack(pop) + +#endif diff --git a/vmmon-only/include/cpu_defs.h b/vmmon-only/include/cpu_defs.h new file mode 100644 index 00000000..03f7b702 --- /dev/null +++ b/vmmon-only/include/cpu_defs.h @@ -0,0 +1,49 @@ +/********************************************************* + * Copyright (C) 2009 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * cpu_defs.h -- + * + * CPU-related definitions shared between vmkernel and user-space. + */ + +#ifndef CPU_DEFS_H +#define CPU_DEFS_H + +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_DISTRIBUTE +#define INCLUDE_ALLOW_VMKDRIVERS +#define INCLUDE_ALLOW_VMK_MODULE +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_USERLEVEL +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_VMMON + +#define INCLUDE_ALLOW_VMX +#include "includeCheck.h" + +#include "vm_basic_types.h" + +typedef uint32 PCPU; +#define INVALID_PCPU ((PCPU) -1) + +#define MAX_PCPUS 576 +#define MAX_PCPUS_BITS 10 // MAX_PCPUS <= (1 << MAX_PCPUS_BITS) +#define MAX_PCPUS_MASK ((1 << MAX_PCPUS_BITS) - 1) + +#endif diff --git a/vmmon-only/include/cpuid_info.h b/vmmon-only/include/cpuid_info.h new file mode 100644 index 00000000..1d3ba307 --- /dev/null +++ b/vmmon-only/include/cpuid_info.h @@ -0,0 +1,95 @@ +/********************************************************* + * Copyright (C) 1998-2015 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. 
+ * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef _CPUID_INFO_H +#define _CPUID_INFO_H + +#define INCLUDE_ALLOW_USERLEVEL +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_VMKERNEL + +#include "includeCheck.h" + +#include "vm_basic_asm.h" +#include "x86cpuid_asm.h" + + +typedef struct CPUID0 { + int numEntries; + char name[16]; // 4 extra bytes to null terminate +} CPUID0; + +typedef struct CPUID1 { + uint32 version; + uint32 ebx; + uint32 ecxFeatures; + uint32 edxFeatures; +} CPUID1; + +typedef struct CPUID80 { + uint32 numEntries; + uint32 ebx; + uint32 ecx; + uint32 edx; +} CPUID80; + +typedef struct CPUID81 { + uint32 eax; + uint32 ebx; + uint32 ecxFeatures; + uint32 edxFeatures; +} CPUID81; + +typedef struct CPUIDSummary { + CPUID0 id0; + CPUID1 id1; + CPUIDRegs ida; + CPUID80 id80; + CPUID81 id81; + CPUIDRegs id88, id8a; +} CPUIDSummary; + + +/* + *---------------------------------------------------------------------- + * + * CPUIDSummary_RegsFromCpuid0 -- + * + * Fills in the given CPUIDRegs struct with the values from the CPUID0 struct. + * + * Results: + * Returns the CPUIDRegs pointer passed in. + * + * Side effects: + * None. + * + *---------------------------------------------------------------------- + */ +static INLINE CPUIDRegs* +CPUIDSummary_RegsFromCpuid0(CPUID0* id0In, + CPUIDRegs* id0Out) +{ + id0Out->eax = id0In->numEntries; + id0Out->ebx = *(uint32 *) (id0In->name + 0); + id0Out->edx = *(uint32 *) (id0In->name + 4); + id0Out->ecx = *(uint32 *) (id0In->name + 8); + return id0Out; +} + +#endif diff --git a/vmmon-only/include/crossgdt.h b/vmmon-only/include/crossgdt.h new file mode 100644 index 00000000..ad823eaa --- /dev/null +++ b/vmmon-only/include/crossgdt.h @@ -0,0 +1,79 @@ +/********************************************************* + * Copyright (C) 2006-2014 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * crossgdt.h -- + * + * This GDT is used for switching between monitor and host context. + * It contains the host and monitor basic segment descriptors. + * There is only one in the whole host system, shared by all VMs. + * It is allocated when the first VCPU is started and freed when the + * driver is unloaded. 
+ */ + +#ifndef _CROSSGDT_H_ +#define _CROSSGDT_H_ + +#define INCLUDE_ALLOW_USERLEVEL + +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMCORE +#include "includeCheck.h" + +#include "vm_basic_defs.h" // PAGE_SIZE +#include "x86types.h" // Descriptor + +typedef struct CrossGDT { + Descriptor gdtes[0x5000 / sizeof (Descriptor)]; // 0x5000 > GDT_LIMIT +} CrossGDT; + +#define CROSSGDT_NUMPAGES ((sizeof (CrossGDT) + PAGE_SIZE - 1) / PAGE_SIZE) + +/* + * Out of the 5 pages, only the first and last are really used. + * + * All we need to map are the first and last pages. This mask tells + * the setup code which pages it can put stuff in and it tells the + * mapping and invalidation code which pages are mapped and unmapped. + */ +#define CROSSGDT_PAGEMASK 0x11 + +/* + * These segments are placed in the first crossGDT page. We assume + * they do not overlap any host segments (checked by + * Task_InitCrossGDT). The only real requirement is that they (and + * the host CS/SS) be physically contiguous with the start of the + * crossGDT so they will remain valid when paging is turned off. + * + * As of this writing (Nov 2006), host GDT limits: + * Linux 64 bit: 80 (yes 80, not 7F) + * 32 bit: FF + * MacOS 64 bit: 8F + * 32 bit: 8F + * Windows 64 bit: 6F + * 32 bit: 3FF + */ +#define CROSSGDT_LOWSEG (0x0FD0 / 8) // all host segs must be below this +#define CROSSGDT_64BITCS (0x0FD0 / 8) // 64-bit code segment +#define CROSSGDT_64BITSS (0x0FD8 / 8) // 64-bit data segment +#define CROSSGDT_FLAT32CS (0x0FE0 / 8) // 32-bit flat code seg +#define CROSSGDT_FLAT32SS (0x0FE8 / 8) // 32-bit flat data seg +#define CROSSGDT_MON32CS (0x0FF0 / 8) // 32-bit FFC00000 base code seg +#define CROSSGDT_MON32SS (0x0FF8 / 8) // 32-bit FFC00000 base data seg + +#endif diff --git a/vmmon-only/include/driver-config.h b/vmmon-only/include/driver-config.h new file mode 100644 index 00000000..fbf45d3c --- /dev/null +++ b/vmmon-only/include/driver-config.h @@ -0,0 +1,79 @@ +/********************************************************* + * Copyright (C) 1998 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * Sets the proper defines from the Linux header files + * + * This file must be included before the inclusion of any kernel header file, + * with the exception of linux/autoconf.h and linux/version.h --hpreg + */ + +#ifndef __VMX_CONFIG_H__ +#define __VMX_CONFIG_H__ + +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_DISTRIBUTE +#define INCLUDE_ALLOW_VMKDRIVERS +#include "includeCheck.h" + +#include "compat_version.h" +#include "compat_autoconf.h" + +/* + * We rely on Kernel Module support. Check here. + */ +#ifndef CONFIG_MODULES +# error "No Module support in this kernel. 
Please configure with CONFIG_MODULES" +#endif + +/* + * 2.2 kernels still use __SMP__ (derived from CONFIG_SMP + * in the main Makefile), so we do it here. + */ + +#ifdef CONFIG_SMP +# define __SMP__ 1 +#endif + +#if defined(CONFIG_MODVERSIONS) && defined(KERNEL_2_1) +# if LINUX_VERSION_CODE < KERNEL_VERSION(2,5,60) +/* + * MODVERSIONS might be already defined when using kernel's Makefiles. + */ +# ifndef MODVERSIONS +# define MODVERSIONS +# endif +# include <linux/modversions.h> +# endif +#endif + +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 24) +/* + * Force the uintptr_t definition to come from linux/types.h instead of vm_basic_types.h. + */ +# include <linux/types.h> +# define _STDINT_H 1 +#endif + +#ifndef __KERNEL__ +# define __KERNEL__ +#endif + +#endif diff --git a/vmmon-only/include/hashFunc.h b/vmmon-only/include/hashFunc.h new file mode 100644 index 00000000..fec72614 --- /dev/null +++ b/vmmon-only/include/hashFunc.h @@ -0,0 +1,345 @@ +/********************************************************* + * Copyright (C) 2001,2016 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef _HASH_FUNC_H +#define _HASH_FUNC_H + +#define INCLUDE_ALLOW_USERLEVEL +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_VMKERNEL + +#include "includeCheck.h" + +/* + * hashFunc.h -- + * + * Hash functions defined as simple wrappers around code placed + * in the public domain by Bob Jenkins. His original code can + * be used freely for any purpose, including commercial (see the + * original comments in the enclosed code). + */ + +#include "vm_basic_types.h" +#include "vm_basic_defs.h" +#include "vm_assert.h" + +/* + * operations + */ + +extern uint64 HashFunc_HashBytes(const uint8 *key, uint32 nBytes); +extern uint64 HashFunc_HashMoreBytes(const uint8 *key, uint32 nBytes, + uint64 initialValue); +extern uint64 HashFunc_HashBytesSlow(const uint8 *key, uint32 nBytes); +extern uint64 HashFunc_HashQuads(const uint64 *key, uint32 nQuads); +extern uint64 HashFunc_HashPage(const void *addr); + +/* +-------------------------------------------------------------------- +Hashes 32-bit key and returns a value that can fit into numBits bits. +-------------------------------------------------------------------- +*/ + +static INLINE uint32 +HashFunc_TruncHash32(uint32 key, unsigned numBits) +{ + const uint32 hashConst = 0x9e3779b9; /* the golden ratio */ + ASSERT(numBits > 0 && numBits <= 32); + return (key * hashConst) >> (32 - numBits); +} + +/* +-------------------------------------------------------------------- +Hashes 64-bit key and returns a value that can fit into numBits bits.
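+For example (illustrative usage only, not part of the original sources): +HashFunc_TruncHash64(key, 10) returns a value in [0, 1023], i.e. an index +suitable for a 1024-entry (hashsize(10)) table.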
+-------------------------------------------------------------------- +*/ + +static INLINE uint32 +HashFunc_TruncHash64(uint64 key, unsigned numBits) +{ + return HashFunc_TruncHash32((uint32)(key ^ (key >> 32)), numBits); +} + + +/* + * Original Bob Jenkins public-domain code with minor modifications + * (static functions, 32-bit length args, disabled self-test code). + */ + + +typedef uint64 ub8; /* unsigned 8-byte quantities */ +typedef uint32 ub4; /* unsigned 4-byte quantities */ +typedef uint8 ub1; + +#define hashsize(n) ((ub8)1<<(n)) +#define hashmask(n) (hashsize(n)-1) + +/* +-------------------------------------------------------------------- +mix -- mix 3 64-bit values reversibly. +mix() takes 48 machine instructions, but only 24 cycles on a superscalar + machine (like Intel's new MMX architecture). It requires 4 64-bit + registers for 4::2 parallelism. +All 1-bit deltas, all 2-bit deltas, all deltas composed of top bits of + (a,b,c), and all deltas of bottom bits were tested. All deltas were + tested both on random keys and on keys that were nearly all zero. + These deltas all cause every bit of c to change between 1/3 and 2/3 + of the time (well, only 113/400 to 287/400 of the time for some + 2-bit delta). These deltas all cause at least 80 bits to change + among (a,b,c) when the mix is run either forward or backward (yes it + is reversible). +This implies that a hash using mix64 has no funnels. There may be + characteristics with 3-bit deltas or bigger, I didn't test for + those. +-------------------------------------------------------------------- +*/ +#define mix64(a,b,c) \ +{ \ + a -= b; a -= c; a ^= (c>>43); \ + b -= c; b -= a; b ^= (a<<9); \ + c -= a; c -= b; c ^= (b>>8); \ + a -= b; a -= c; a ^= (c>>38); \ + b -= c; b -= a; b ^= (a<<23); \ + c -= a; c -= b; c ^= (b>>5); \ + a -= b; a -= c; a ^= (c>>35); \ + b -= c; b -= a; b ^= (a<<49); \ + c -= a; c -= b; c ^= (b>>11); \ + a -= b; a -= c; a ^= (c>>12); \ + b -= c; b -= a; b ^= (a<<18); \ + c -= a; c -= b; c ^= (b>>22); \ +} + +/* +-------------------------------------------------------------------- +hash() -- hash a variable-length key into a 64-bit value + k : the key (the unaligned variable-length array of bytes) + len : the length of the key, counting by bytes + level : can be any 8-byte value +Returns a 64-bit value. Every bit of the key affects every bit of +the return value. No funnels. Every 1-bit and 2-bit delta achieves +avalanche. About 41+5len instructions. + +The best hash table sizes are powers of 2. There is no need to do +mod a prime (mod is sooo slow!). If you need less than 64 bits, +use a bitmask. For example, if you need only 10 bits, do + h = (h & hashmask(10)); +In which case, the hash table should have hashsize(10) elements. 
+ +If you are hashing n strings (ub1 **)k, do it like this: + for (i=0, h=0; i<n; ++i) h = hash(k[i], len[i], h); +-------------------------------------------------------------------- +*/ + +static INLINE ub8 hash(register const ub1 *k, /* the key */ + register ub4 length, /* the length of the key */ + register ub8 level) /* the previous hash, or an arbitrary value */ +{ + register ub8 a,b,c; + ub4 len; + + /* Set up the internal state */ + len = length; + a = b = level; /* the previous hash value */ + c = CONST64U(0x9e3779b97f4a7c13); /* the golden ratio; an arbitrary value */ + + /*---------------------------------------- handle most of the key */ + while (len >= 24) + { + a += (k[0] +((ub8)k[ 1]<< 8)+((ub8)k[ 2]<<16)+((ub8)k[ 3]<<24) + +((ub8)k[4 ]<<32)+((ub8)k[ 5]<<40)+((ub8)k[ 6]<<48)+((ub8)k[ 7]<<56)); + b += (k[8] +((ub8)k[ 9]<< 8)+((ub8)k[10]<<16)+((ub8)k[11]<<24) + +((ub8)k[12]<<32)+((ub8)k[13]<<40)+((ub8)k[14]<<48)+((ub8)k[15]<<56)); + c += (k[16] +((ub8)k[17]<< 8)+((ub8)k[18]<<16)+((ub8)k[19]<<24) + +((ub8)k[20]<<32)+((ub8)k[21]<<40)+((ub8)k[22]<<48)+((ub8)k[23]<<56)); + mix64(a,b,c); + k += 24; len -= 24; + } + + /*------------------------------------- handle the last 23 bytes */ + c += length; + switch(len) /* all the case statements fall through */ + { + case 23: c+=((ub8)k[22]<<56); + case 22: c+=((ub8)k[21]<<48); + case 21: c+=((ub8)k[20]<<40); + case 20: c+=((ub8)k[19]<<32); + case 19: c+=((ub8)k[18]<<24); + case 18: c+=((ub8)k[17]<<16); + case 17: c+=((ub8)k[16]<<8); + /* the first byte of c is reserved for the length */ + case 16: b+=((ub8)k[15]<<56); + case 15: b+=((ub8)k[14]<<48); + case 14: b+=((ub8)k[13]<<40); + case 13: b+=((ub8)k[12]<<32); + case 12: b+=((ub8)k[11]<<24); + case 11: b+=((ub8)k[10]<<16); + case 10: b+=((ub8)k[ 9]<<8); + case 9: b+=((ub8)k[ 8]); + case 8: a+=((ub8)k[ 7]<<56); + case 7: a+=((ub8)k[ 6]<<48); + case 6: a+=((ub8)k[ 5]<<40); + case 5: a+=((ub8)k[ 4]<<32); + case 4: a+=((ub8)k[ 3]<<24); + case 3: a+=((ub8)k[ 2]<<16); + case 2: a+=((ub8)k[ 1]<<8); + case 1: a+=((ub8)k[ 0]); + /* case 0: nothing left to add */ + } + mix64(a,b,c); + /*-------------------------------------------- report the result */ + return c; +} + +/* +-------------------------------------------------------------------- + This works on all machines, is identical to hash() on little-endian + machines, and it is much faster than hash(), but it requires + -- that the key be an array of ub8's, and + -- that all your machines have the same endianness, and + -- that the length be the number of ub8's in the key +-------------------------------------------------------------------- +*/ +static INLINE ub8 hash2(register const ub8 *k, /* the key */ + register ub4 length, /* the length of the key */ + register ub8 level) /* the previous hash, or an arbitrary value */ +{ + register ub8 a,b,c; + ub4 len; + + /* Set up the internal state */ + len = length; + a = b = level; /* the previous hash value */ + c = CONST64U(0x9e3779b97f4a7c13); /* the golden ratio; an arbitrary value */ + + /*---------------------------------------- handle most of the key */ + while (len >= 3) + { + a += k[0]; + b += k[1]; + c += k[2]; + mix64(a,b,c); + k += 3; len -= 3; + } + + /*-------------------------------------- handle the last 2 ub8's */ + c += length; + switch(len) /* all the case statements fall through */ + { + /* c is reserved for the length */ + case 2: b+=k[1]; + case 1: a+=k[0]; + /* case 0: nothing left to add */ + } + mix64(a,b,c); + /*-------------------------------------------- report the result */ + return c; +} + +/* +-------------------------------------------------------------------- + This is identical to hash() on little-endian machines, and it is much + faster than hash(), but a little slower than hash2(), and it requires + -- that all your machines be little-endian, for example all Intel x86 + chips or all VAXen. It gives wrong results on big-endian machines.
+-------------------------------------------------------------------- +*/ + +static INLINE ub8 hash3(register const ub1 *k, /* the key */ + register ub4 length, /* the length of the key */ + register ub8 level) /* the previous hash, or an arbitrary value */ +{ + register ub8 a,b,c; + ub4 len; + + /* Set up the internal state */ + len = length; + a = b = level; /* the previous hash value */ + c = CONST64U(0x9e3779b97f4a7c13); /* the golden ratio; an arbitrary value */ + + /*---------------------------------------- handle most of the key */ + if (((size_t)k)&7) + { + while (len >= 24) + { + a += (k[0] +((ub8)k[ 1]<< 8)+((ub8)k[ 2]<<16)+((ub8)k[ 3]<<24) + +((ub8)k[4 ]<<32)+((ub8)k[ 5]<<40)+((ub8)k[ 6]<<48)+((ub8)k[ 7]<<56)); + b += (k[8] +((ub8)k[ 9]<< 8)+((ub8)k[10]<<16)+((ub8)k[11]<<24) + +((ub8)k[12]<<32)+((ub8)k[13]<<40)+((ub8)k[14]<<48)+((ub8)k[15]<<56)); + c += (k[16] +((ub8)k[17]<< 8)+((ub8)k[18]<<16)+((ub8)k[19]<<24) + +((ub8)k[20]<<32)+((ub8)k[21]<<40)+((ub8)k[22]<<48)+((ub8)k[23]<<56)); + mix64(a,b,c); + k += 24; len -= 24; + } + } + else + { + while (len >= 24) /* aligned */ + { + a += *(ub8 *)(k+0); + b += *(ub8 *)(k+8); + c += *(ub8 *)(k+16); + mix64(a,b,c); + k += 24; len -= 24; + } + } + + /*------------------------------------- handle the last 23 bytes */ + c += length; + switch(len) /* all the case statements fall through */ + { + case 23: c+=((ub8)k[22]<<56); + case 22: c+=((ub8)k[21]<<48); + case 21: c+=((ub8)k[20]<<40); + case 20: c+=((ub8)k[19]<<32); + case 19: c+=((ub8)k[18]<<24); + case 18: c+=((ub8)k[17]<<16); + case 17: c+=((ub8)k[16]<<8); + /* the first byte of c is reserved for the length */ + case 16: b+=((ub8)k[15]<<56); + case 15: b+=((ub8)k[14]<<48); + case 14: b+=((ub8)k[13]<<40); + case 13: b+=((ub8)k[12]<<32); + case 12: b+=((ub8)k[11]<<24); + case 11: b+=((ub8)k[10]<<16); + case 10: b+=((ub8)k[ 9]<<8); + case 9: b+=((ub8)k[ 8]); + case 8: a+=((ub8)k[ 7]<<56); + case 7: a+=((ub8)k[ 6]<<48); + case 6: a+=((ub8)k[ 5]<<40); + case 5: a+=((ub8)k[ 4]<<32); + case 4: a+=((ub8)k[ 3]<<24); + case 3: a+=((ub8)k[ 2]<<16); + case 2: a+=((ub8)k[ 1]<<8); + case 1: a+=((ub8)k[ 0]); + /* case 0: nothing left to add */ + } + mix64(a,b,c); + /*-------------------------------------------- report the result */ + return c; +} + +#endif //_HASH_FUNC_H diff --git a/vmmon-only/include/includeCheck.h b/vmmon-only/include/includeCheck.h new file mode 100644 index 00000000..08fd1e58 --- /dev/null +++ b/vmmon-only/include/includeCheck.h @@ -0,0 +1,17 @@ +/********************************************************* + * Copyright (C) 2008 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. 
+ * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ diff --git a/vmmon-only/include/initblock.h b/vmmon-only/include/initblock.h new file mode 100644 index 00000000..e101e9ff --- /dev/null +++ b/vmmon-only/include/initblock.h @@ -0,0 +1,43 @@ +/********************************************************* + * Copyright (C) 1998 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef _INITBLOCK_H +#define _INITBLOCK_H + + +#define INCLUDE_ALLOW_VMX +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_VMMON +#include "includeCheck.h" + + +#include "basic_initblock.h" + + +#define MAX_LOGFILE_NAME_LENGTH 256 +#define MAX_MONITOR_REGIONS 8 +#define INIT_BLOCK_MAGIC (0x1789+14) + + +/* + * Option flags + */ +/* None yet */ + + +#endif diff --git a/vmmon-only/include/iocontrols.h b/vmmon-only/include/iocontrols.h new file mode 100644 index 00000000..6bce93ee --- /dev/null +++ b/vmmon-only/include/iocontrols.h @@ -0,0 +1,623 @@ +/********************************************************* + * Copyright (C) 1998-2015 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + + +/* + * iocontrols.h + * + * The driver io controls. + */ + +#ifndef _IOCONTROLS_H_ +#define _IOCONTROLS_H_ + +#define INCLUDE_ALLOW_USERLEVEL + +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_MODULE +#include "includeCheck.h" + +#ifdef VMX86_SERVER +#error iocontrols.h is for hosted vmmon, do not use on visor +#endif + +#include "basic_initblock.h" +#include "x86segdescrs.h" +#include "rateconv.h" +#include "overheadmem_types.h" +#include "pageLock_defs.h" +#include "numa_defs.h" + +/* + *----------------------------------------------------------------------------- + * + * VA64ToPtr -- + * + * Convert a VA64 to a pointer. 
+ * + * Usage of this function is strictly limited to these 2 cases: + * + * 1) In a VMX function which does an ioctl to vmmon, and receives a VMX + * pointer as a result. + * + * 2) In the vmmon code, for the functions which have a VA64 and need + * to call kernel APIs which take pointers. + * + * Results: + * Virtual address. + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void * +VA64ToPtr(VA64 va64) // IN +{ +#ifdef VM_64BIT + ASSERT_ON_COMPILE(sizeof (void *) == 8); +#else + ASSERT_ON_COMPILE(sizeof (void *) == 4); + // Check that nothing of value will be lost. + ASSERT(!(va64 >> 32)); +#endif + return (void *)(uintptr_t)va64; +} + + +/* + *----------------------------------------------------------------------------- + * + * PtrToVA64 -- + * + * Convert a pointer to a VA64. + * + * Usage of this function is strictly limited to these 2 cases: + * + * 1) In a VMX function which does an ioctl to vmmon, and passes in a VMX + * pointer. + * + * 2) In the vmmon code, for the functions which need to pass in a kernel + * pointer to functions which can take either a user or a kernel + * pointer in the same parameter. + * + * Results: + * Virtual address. + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE VA64 +PtrToVA64(void const *ptr) // IN +{ + ASSERT_ON_COMPILE(sizeof ptr <= sizeof (VA64)); + return (VA64)(uintptr_t)ptr; +} + + +/* + * Driver version. + * + * Increment major version when you make an incompatible change. + * Compatibility goes both ways (old driver with new executable + * as well as new driver with old executable). + * + * Note: Vmcore compatibility is different from driver versioning. + * For vmcore puposes, the bora tree is conceptually split in two: + * vmcore, and rest-of-bora. The vmmon driver is largely outside + * vmcore and vmcore imports functionality from vmmon. Addition, + * deletion or modification of an iocontrol used only by rest-of-bora + * does not break vmcore compatibility. + * + * See bora/doc/vmcore details. + * + */ + +#define VMMON_VERSION (308 << 16 | 0) +#define VMMON_VERSION_MAJOR(v) ((uint32) (v) >> 16) +#define VMMON_VERSION_MINOR(v) ((uint16) (v)) + + +/* + * ENOMEM returned after MAX_VMS virtual machines created + */ + +#ifdef VMX86_SERVER +#define MAX_VMS 128 +#else +#define MAX_VMS 64 +#endif +/* + * MsgWaitForMultipleObjects doesn't scale well enough on Win32. + * Allocate with MAX_VMS so static buffers are large, but do + * admissions control with this value on Win32 until we check + * scalability (probably in authd). + */ +#ifdef _WIN32 +#define MAX_VMS_WIN32 64 +#endif + + +#if !__linux__ +/* + * On platforms other than Linux, IOCTLCMD_foo values are just numbers, and + * we build the IOCTL_VMX86_foo values around these using platform-specific + * format for encoding arguments and sizes. + */ +# define IOCTLCMD(_cmd) IOCTLCMD_ ## _cmd +#else // if __linux__ +/* + * Linux defines _IO* macros, but the core kernel code ignore the encoded + * ioctl value. It is up to individual drivers to decode the value (for + * example to look at the size of a structure to determine which version + * of a specific command should be used) or not (which is what we + * currently do, so right now the ioctl value for a given command is the + * command itself). + * + * Hence, we just define the IOCTL_VMX86_foo values directly, with no + * intermediate IOCTLCMD_ representation. 
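+ * + * For example (illustrative expansion only, no additional definitions): on + * Linux, IOCTLCMD(VERSION) expands directly to IOCTL_VMX86_VERSION, whereas + * on the other platforms it names the enum constant IOCTLCMD_VERSION, which + * the platform-specific wrappers below encode into the final ioctl value.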
+ */ +# define IOCTLCMD(_cmd) IOCTL_VMX86_ ## _cmd +#endif + + +enum IOCTLCmd { + /* + * We need to bracket the range of values used for ioctls, because x86_64 + * Linux forces us to explicitly register ioctl handlers by value for + * handling 32 bit ioctl syscalls. Hence FIRST and LAST. FIRST must be + * 2001 so that VERSION is 2001 for backwards compatibility. + */ +#if defined __linux__ || defined _WIN32 + /* Start at 2001 because legacy code did. */ + IOCTLCMD(FIRST) = 2001, +#else + /* Start at 0. */ + IOCTLCMD(FIRST), +#endif + IOCTLCMD(VERSION) = IOCTLCMD(FIRST), + IOCTLCMD(CREATE_VM), + IOCTLCMD(RELEASE_VM), + IOCTLCMD(GET_NUM_VMS), + IOCTLCMD(ALLOC_CROSSGDT), + IOCTLCMD(INIT_VM), + IOCTLCMD(INIT_CROSSGDT), + IOCTLCMD(RUN_VM), + IOCTLCMD(LOOK_UP_MPN), + IOCTLCMD(LOCK_PAGE), + IOCTLCMD(UNLOCK_PAGE), + IOCTLCMD(APIC_INIT), + IOCTLCMD(SET_HARD_LIMIT), + IOCTLCMD(GET_MEM_INFO), + IOCTLCMD(ADMIT), + IOCTLCMD(UPDATE_MEM_INFO), + IOCTLCMD(READMIT), + IOCTLCMD(PAE_ENABLED), + IOCTLCMD(GET_TOTAL_MEM_USAGE), + IOCTLCMD(GET_KHZ_ESTIMATE), + IOCTLCMD(SET_HOST_CLOCK_RATE), + IOCTLCMD(READ_PAGE), + IOCTLCMD(WRITE_PAGE), + IOCTLCMD(LOCK_PAGE_NEW), + IOCTLCMD(UNLOCK_PAGE_BY_MPN), + /* AWE calls */ + IOCTLCMD(ALLOC_LOCKED_PAGES), + IOCTLCMD(FREE_LOCKED_PAGES), + IOCTLCMD(GET_NEXT_ANON_PAGE), + IOCTLCMD(GET_LOCKED_PAGES_LIST), + + IOCTLCMD(GET_ALL_MSRS), + + IOCTLCMD(COUNT_PRESENT_PAGES), + + IOCTLCMD(GET_REFERENCE_CLOCK_HZ), + IOCTLCMD(INIT_PSEUDO_TSC), + IOCTLCMD(CHECK_PSEUDO_TSC), + IOCTLCMD(GET_PSEUDO_TSC), + + IOCTLCMD(SYNC_GET_TSCS), + + IOCTLCMD(GET_IPI_VECTORS), + IOCTLCMD(SEND_IPI), + + /* + * Keep host-specific calls at the end so they can be undefined + * without renumbering the common calls. + */ + +#if defined __linux__ + IOCTLCMD(SET_UID), // VMX86_DEVEL only +#endif + +#if defined __linux__ || defined __APPLE__ + IOCTLCMD(GET_ALL_CPUID), + IOCTLCMD(GET_KERNEL_CLOCK_RATE), +#endif + +#if defined _WIN32 || defined __APPLE__ + IOCTLCMD(ALLOC_CONTIG_PAGES), +#endif + +#if defined _WIN32 + IOCTLCMD(FREE_CONTIG_PAGES), + IOCTLCMD(HARD_LIMIT_MONITOR_STATUS), // Windows 2000 only + IOCTLCMD(BLUE_SCREEN), // USE_BLUE_SCREEN only + IOCTLCMD(CHANGE_HARD_LIMIT), + IOCTLCMD(GET_KERNEL_PROC_ADDRESS), + IOCTLCMD(READ_VA64), + IOCTLCMD(SET_MEMORY_PARAMS), + IOCTLCMD(REMEMBER_KHZ_ESTIMATE), + IOCTLCMD(REMAP_SCATTER_LIST), + IOCTLCMD(UNMAP_SCATTER_LIST), +#endif + +#if defined __APPLE__ + IOCTLCMD(ALLOC_LOW_PAGES), + IOCTLCMD(INIT_DRIVER), + IOCTLCMD(BLUEPILL), +#endif + + IOCTLCMD(SET_POLL_TIMEOUT_PTR), + + IOCTLCMD(FAST_SUSP_RES_SET_OTHER_FLAG), + IOCTLCMD(FAST_SUSP_RES_GET_MY_FLAG), + +#if defined __linux__ + IOCTLCMD(SET_HOST_CLOCK_PRIORITY), + IOCTLCMD(VMX_ENABLED), + IOCTLCMD(SET_HOST_SWAP_SIZE), +#endif + + IOCTLCMD(GET_UNAVAIL_PERF_CTRS), + // Must be last. + IOCTLCMD(LAST) +}; + + +#if defined _WIN32 +/* + * Windows ioctl definitions. + * + * We use the IRP Information field for the return value + * of IOCTLCMD_RUN_VM, to be faster since it is used a lot. 
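+ * + * For example (illustrative, using the macros defined below): + * IOCTL_VMX86_VERSION == CTL_CODE(FILE_DEVICE_VMX86, + * VMX86_IOCTL_BASE_INDEX + IOCTLCMD_VERSION, + * METHOD_BUFFERED, FILE_ANY_ACCESS)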
+ */ + +#define FILE_DEVICE_VMX86 0x8101 +#define VMX86_IOCTL_BASE_INDEX 0x801 +#define VMIOCTL_BUFFERED(name) \ + CTL_CODE(FILE_DEVICE_VMX86, \ + VMX86_IOCTL_BASE_INDEX + IOCTLCMD_ ## name, \ + METHOD_BUFFERED, \ + FILE_ANY_ACCESS) +#define VMIOCTL_NEITHER(name) \ + CTL_CODE(FILE_DEVICE_VMX86, \ + VMX86_IOCTL_BASE_INDEX + IOCTLCMD_ ## name, \ + METHOD_NEITHER, \ + FILE_ANY_ACCESS) + +#define IOCTL_VMX86_VERSION VMIOCTL_BUFFERED(VERSION) +#define IOCTL_VMX86_CREATE_VM VMIOCTL_BUFFERED(CREATE_VM) +#define IOCTL_VMX86_RELEASE_VM VMIOCTL_BUFFERED(RELEASE_VM) +#define IOCTL_VMX86_GET_NUM_VMS VMIOCTL_BUFFERED(GET_NUM_VMS) +#define IOCTL_VMX86_ALLOC_CROSSGDT VMIOCTL_BUFFERED(ALLOC_CROSSGDT) +#define IOCTL_VMX86_INIT_VM VMIOCTL_BUFFERED(INIT_VM) +#define IOCTL_VMX86_INIT_CROSSGDT VMIOCTL_BUFFERED(INIT_CROSSGDT) +#define IOCTL_VMX86_RUN_VM VMIOCTL_NEITHER(RUN_VM) +#define IOCTL_VMX86_SEND_IPI VMIOCTL_NEITHER(SEND_IPI) +#define IOCTL_VMX86_GET_IPI_VECTORS VMIOCTL_BUFFERED(GET_IPI_VECTORS) +#define IOCTL_VMX86_LOOK_UP_MPN VMIOCTL_BUFFERED(LOOK_UP_MPN) +#define IOCTL_VMX86_LOCK_PAGE VMIOCTL_BUFFERED(LOCK_PAGE) +#define IOCTL_VMX86_UNLOCK_PAGE VMIOCTL_BUFFERED(UNLOCK_PAGE) +#define IOCTL_VMX86_APIC_INIT VMIOCTL_BUFFERED(APIC_INIT) +#define IOCTL_VMX86_SET_HARD_LIMIT VMIOCTL_BUFFERED(SET_HARD_LIMIT) +#define IOCTL_VMX86_GET_MEM_INFO VMIOCTL_BUFFERED(GET_MEM_INFO) +#define IOCTL_VMX86_ADMIT VMIOCTL_BUFFERED(ADMIT) +#define IOCTL_VMX86_READMIT VMIOCTL_BUFFERED(READMIT) +#define IOCTL_VMX86_UPDATE_MEM_INFO VMIOCTL_BUFFERED(UPDATE_MEM_INFO) +#define IOCTL_VMX86_PAE_ENABLED VMIOCTL_BUFFERED(PAE_ENABLED) +#define IOCTL_VMX86_BEEP VMIOCTL_BUFFERED(BEEP) +#define IOCTL_VMX86_HARD_LIMIT_MONITOR_STATUS VMIOCTL_BUFFERED(HARD_LIMIT_MONITOR_STATUS) +#define IOCTL_VMX86_CHANGE_HARD_LIMIT VMIOCTL_BUFFERED(CHANGE_HARD_LIMIT) +#define IOCTL_VMX86_ALLOC_CONTIG_PAGES VMIOCTL_BUFFERED(ALLOC_CONTIG_PAGES) +#define IOCTL_VMX86_FREE_CONTIG_PAGES VMIOCTL_BUFFERED(FREE_CONTIG_PAGES) + +#define IOCTL_VMX86_GET_TOTAL_MEM_USAGE VMIOCTL_BUFFERED(GET_TOTAL_MEM_USAGE) +#define IOCTL_VMX86_GET_KHZ_ESTIMATE VMIOCTL_BUFFERED(GET_KHZ_ESTIMATE) +#define IOCTL_VMX86_SET_HOST_CLOCK_RATE VMIOCTL_BUFFERED(SET_HOST_CLOCK_RATE) +#define IOCTL_VMX86_SYNC_GET_TSCS VMIOCTL_BUFFERED(SYNC_GET_TSCS) +#define IOCTL_VMX86_READ_PAGE VMIOCTL_BUFFERED(READ_PAGE) +#define IOCTL_VMX86_WRITE_PAGE VMIOCTL_BUFFERED(WRITE_PAGE) +#define IOCTL_VMX86_LOCK_PAGE_NEW VMIOCTL_BUFFERED(LOCK_PAGE_NEW) +#define IOCTL_VMX86_UNLOCK_PAGE_BY_MPN VMIOCTL_BUFFERED(UNLOCK_PAGE_BY_MPN) +#define IOCTL_VMX86_ALLOC_LOCKED_PAGES VMIOCTL_BUFFERED(ALLOC_LOCKED_PAGES) +#define IOCTL_VMX86_FREE_LOCKED_PAGES VMIOCTL_BUFFERED(FREE_LOCKED_PAGES) +#define IOCTL_VMX86_GET_NEXT_ANON_PAGE VMIOCTL_BUFFERED(GET_NEXT_ANON_PAGE) +#define IOCTL_VMX86_GET_LOCKED_PAGES_LIST VMIOCTL_BUFFERED(GET_LOCKED_PAGES_LIST) + +#define IOCTL_VMX86_GET_KERNEL_PROC_ADDRESS VMIOCTL_BUFFERED(GET_KERNEL_PROC_ADDRESS) +#define IOCTL_VMX86_READ_VA64 VMIOCTL_BUFFERED(READ_VA64) +#define IOCTL_VMX86_SET_MEMORY_PARAMS VMIOCTL_BUFFERED(SET_MEMORY_PARAMS) + +#define IOCTL_VMX86_REMEMBER_KHZ_ESTIMATE VMIOCTL_BUFFERED(REMEMBER_KHZ_ESTIMATE) + +#define IOCTL_VMX86_GET_ALL_MSRS VMIOCTL_BUFFERED(GET_ALL_MSRS) +#define IOCTL_VMX86_COUNT_PRESENT_PAGES VMIOCTL_BUFFERED(COUNT_PRESENT_PAGES) + +#define IOCTL_VMX86_FAST_SUSP_RES_SET_OTHER_FLAG VMIOCTL_BUFFERED(FAST_SUSP_RES_SET_OTHER_FLAG) +#define IOCTL_VMX86_FAST_SUSP_RES_GET_MY_FLAG VMIOCTL_BUFFERED(FAST_SUSP_RES_GET_MY_FLAG) + +#define IOCTL_VMX86_GET_REFERENCE_CLOCK_HZ 
VMIOCTL_BUFFERED(GET_REFERENCE_CLOCK_HZ) +#define IOCTL_VMX86_INIT_PSEUDO_TSC VMIOCTL_BUFFERED(INIT_PSEUDO_TSC) +#define IOCTL_VMX86_CHECK_PSEUDO_TSC VMIOCTL_BUFFERED(CHECK_PSEUDO_TSC) +#define IOCTL_VMX86_GET_PSEUDO_TSC VMIOCTL_NEITHER(GET_PSEUDO_TSC) +#define IOCTL_VMX86_SET_HOST_CLOCK_PRIORITY VMIOCTL_BUFFERED(SET_HOST_CLOCK_PRIORITY) +#define IOCTL_VMX86_GET_UNAVAIL_PERF_CTRS VMIOCTL_NEITHER(GET_UNAVAIL_PERF_CTRS) +#define IOCTL_VMX86_REMAP_SCATTER_LIST VMIOCTL_BUFFERED(REMAP_SCATTER_LIST) +#define IOCTL_VMX86_UNMAP_SCATTER_LIST VMIOCTL_BUFFERED(UNMAP_SCATTER_LIST) +#endif + + +/* + * Flags sent into APICBASE ioctl + */ + +#define APIC_FLAG_DISABLE_NMI 0x00000001 +#define APIC_FLAG_PROBE 0x00000002 +#define APIC_FLAG_FORCE_ENABLE 0x00000004 + +typedef +#include "vmware_pack_begin.h" +struct VMLockPageRet { + MPN mpn; // OUT: MPN + int32 status; // OUT: PAGE_* status code +} +#include "vmware_pack_end.h" +VMLockPageRet; + +typedef +#include "vmware_pack_begin.h" +union { + VA64 uAddr; // IN: user address + VMLockPageRet ret; // OUT: status code and MPN +} +#include "vmware_pack_end.h" +VMLockPage; + + +typedef struct VMAPICInfo { + uint32 flags; +} VMAPICInfo; + +#define VMX86_DRIVER_VCPUID_OFFSET 1000 + + +/* + * We keep track of 3 different limits on the number of pages we can lock. + * The host limit is determined at driver load time (in windows only) to + * make sure we do not starve the host by locking too many pages. + * The static limit is user defined in the UI and the dynamic limit is + * set by authd's hardLimitMonitor code (windows only), which queries + * host load and adjusts the limit accordingly. We lock the minimum of + * all these values at any given time. + */ +typedef struct LockedPageLimit { + uint32 host; // driver calculated maximum for this host + uint32 configured; // user defined maximum pages to lock + uint32 dynamic; // authd hardLimitMonitor pages to lock +} LockedPageLimit; + +/* + * Sentinel VA for IOCTL_VMX86_SET_MEMORY_PARAMS, indicates + * NtQuerySystemInformation should be used to determine the host + * LockedPageLimit. + */ +#define MEMORY_PARAM_USE_SYSINFO_FOR_LOCKED_PAGE_LIMIT ((VA64)(int64)-1) + +/* + * Data structures for the GET_MEM_INFO and ADMIT ioctls. + * + * Be careful adding structs and fields to VMMemInfoArgs and its + * substructures. These are compiled into both the 32-bit and 64-bit + * vmmon drivers and the 32-bit and 64-bit vmx's and need to have + * the same size and layout in all four combinations. Note the + * use of padding below to ensure that this happens. 
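+ * + * For example (informal illustration, not an extra constraint): a + * GET_MEM_INFO request covering four running VMs is sized with + * VM_GET_MEM_INFO_SIZE(4), i.e. sizeof(VMMemInfoArgs) plus room for three + * VMMemMgmtInfo entries beyond the one embedded in the struct.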
+ */ + +typedef struct VMMemMgmtInfo { + uint32 minAllocation; // minimum pages for vm + uint32 maxAllocation; // maximum pages the vm could lock + uint32 shares; // proportional sharing weight + uint32 nonpaged; // overhead memory (guest, mmap) + uint32 paged; // vmx memory (malloc, statics) + uint32 anonymous; // vmm memory + uint32 mainMemSize; // guest main memory size + uint32 locked; // number of pages locked by this vm + uint32 perVMOverhead; // memory for vmx/vmmon overheads + Percent touchedPct; // % of guest memory being touched + Percent dirtiedPct; // % of guest memory being dirtied + Bool admitted; // admission control + uint8 _pad; // for alignment of 64-bit fields + uint64 hugePageBytes; // number of bytes occupied by huge pages + uint64 timestamp; // most recent poll of get mem info time +} VMMemMgmtInfo; + +typedef struct VMMemMgmtInfoPatch { + Percent touchedPct; // % of guest memory being touched + Percent dirtiedPct; // % of guest memory being dirtied + uint8 _pad[6]; + uint64 hugePageBytes; +} VMMemMgmtInfoPatch; + +/* + * See comment on padding and size/layout constraints above when + * when modifying VMMemInfoArgs or its components. + */ + +typedef struct VMMemInfoArgs { + uint64 currentTime; // Host time in secs of the call. + uint32 minVmMemPct; // % of vm that must fit in memory + uint32 globalMinAllocation;// pages that must fit in maxLockedPages + uint32 numLockedPages; // total locked pages by all vms + LockedPageLimit lockedPageLimit; // set of locked page limits + uint32 maxLockedPages; // effective limit on locked pages + uint32 callerIndex; // this vm's index memInfo array + uint32 numVMs; // number of running VMs + uint8 _pad[4]; + VMMemMgmtInfo memInfo[1]; +} VMMemInfoArgs; + +#define VM_GET_MEM_INFO_SIZE(numVMs) \ + (sizeof(VMMemInfoArgs) - sizeof(VMMemMgmtInfo) + (numVMs) * sizeof(VMMemMgmtInfo)) + +typedef struct VMMPNNext { + MPN inMPN; // IN + MPN outMPN; // OUT +} VMMPNNext; + +typedef struct VMMPNList { + uint32 mpnCount; // IN (and OUT on Mac OS) + Bool ignoreLimits; + uint8 _pad[3]; + VA64 mpnList; // IN: User VA of an array of 64-bit MPNs. +} VMMPNList; + +typedef struct VARange { + VA64 addr; + VA64 bv; + unsigned len; + uint32 pad; +} VARange; + +typedef struct VMMUnlockPageByMPN { + MPN mpn; + VA64 uAddr; /* IN: User VA of the page (optional). */ +} VMMUnlockPageByMPN; + +typedef struct VMMReadWritePage { + MPN mpn; // IN + VA64 uAddr; // IN: User VA of a PAGE_SIZE-large buffer. +} VMMReadWritePage; + +struct passthrough_iorange { + unsigned short ioBase; /* Base of range to pass through. */ + unsigned short numPorts; /* Length of range. */ +}; + +/* + * Data structure for the INIT_PSEUDO_TSC and CHECK_PSEUDO_TSC. + */ + +typedef struct PTSCInitParams { + RateConv_Params refClockToPTSC; + uint64 tscHz; + uint64 initialPTSC; + int64 tscOffset; + Bool forceRefClock; + Bool forceTSC; + Bool hwTSCsSynced; + uint8 _pad[5]; +} PTSCInitParams; + +typedef struct PTSCCheckParams { + uint64 lastTSC; + uint64 lastRC; + Bool usingRefClock; + uint8 _pad[7]; +} PTSCCheckParams; + +#ifndef VMX86_SERVER + +typedef struct IPIVectors { + /* + * Vector(s) the host uses for its own IPIs; we use this as a performance + * hint. + */ + uint8 hostIPIVectors[2]; + /* + * Vectors we have allocated or stolen for the monitor interrupts. + */ + uint8 monitorIPIVector; + uint8 hvIPIVector; +} IPIVectors; + +#endif + +/* + * This struct is passed to IOCTL_VMX86_INIT_CROSSGDT to fill in a crossGDT + * entry. 
+ */ +typedef struct InitCrossGDT { + uint32 index; // index in crossGDT to update (offset / 8) + Descriptor value; // value to set the crossGDT entry to +} InitCrossGDT; + +#if defined __linux__ + +/* + * Linux uses mmap(2) to allocate contiguous locked pages, and uses these + * macros to marshall real arguments to mmap's made-up 'offset' argument. + */ + +#define VMMON_MAP_MT_LOW4GB 0 +#define VMMON_MAP_MT_LOW16MB 1 +#define VMMON_MAP_MT_ANY 2 + +#define VMMON_MAP_OFFSET_SHIFT 0 +#define VMMON_MAP_OFFSET_MASK 0x00000FFF +#define VMMON_MAP_ORDER_SHIFT 12 +#define VMMON_MAP_ORDER_MASK 0xF +#define VMMON_MAP_MT_SHIFT 16 +#define VMMON_MAP_MT_MASK 0x7 +#define VMMON_MAP_RSVD_SHIFT 19 + +#define VMMON_MAP_RSVD(base) \ + ((base) >> VMMON_MAP_RSVD_SHIFT) +#define VMMON_MAP_MT(base) \ + (((base) >> VMMON_MAP_MT_SHIFT) & VMMON_MAP_MT_MASK) +#define VMMON_MAP_ORDER(base) \ + (((base) >> VMMON_MAP_ORDER_SHIFT) & VMMON_MAP_ORDER_MASK) +#define VMMON_MAP_OFFSET(base) \ + (((base) >> VMMON_MAP_OFFSET_SHIFT) & VMMON_MAP_OFFSET_MASK) + +#define VMMON_MAP_BASE(mt, order) (((mt) << VMMON_MAP_MT_SHIFT) | \ + ((order) << VMMON_MAP_ORDER_SHIFT)) + +#elif defined _WIN32 +/* + * Windows uses an ioctl to allocate contiguous locked pages. + */ + +typedef struct VMAllocContiguousMem { + VA64 mpnList; // IN: User VA of an array of 64-bit MPNs. + uint32 mpnCount; // IN + uint32 order; // IN + MPN maxMPN; // IN +} VMAllocContiguousMem; +#elif defined __APPLE__ +# include "iocontrolsMacos.h" +#endif + +/* Clean up helper macros */ +#undef IOCTLCMD + +#endif // ifndef _IOCONTROLS_H_ diff --git a/vmmon-only/include/memDefaults.h b/vmmon-only/include/memDefaults.h new file mode 100644 index 00000000..68611708 --- /dev/null +++ b/vmmon-only/include/memDefaults.h @@ -0,0 +1,154 @@ +/********************************************************* + * Copyright (C) 1998-2012 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + + +#ifndef _MEMDEFAULTS_H_ +#define _MEMDEFAULTS_H_ + +#define INCLUDE_ALLOW_USERLEVEL +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_MODULE + +#include "includeCheck.h" + +#include "vm_basic_math.h" +#include "vm_basic_defs.h" + +#define MEMDEFAULTS_MIN_HOST_PAGES MBYTES_2_PAGES(128) + + +/* + *----------------------------------------------------------------------------- + * + * MemDefaults_CalcMaxLockedPages -- + * + * Calculate the rough estimate of the maximum amount of memory + * that can be locked (total for the kernel, all VMs, and other apps), + * based on the size of host memory as supplied in pages. + * + * Results: + * The estimated maximum memory that can be locked in pages. 
+ * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE unsigned +MemDefaults_CalcMaxLockedPages(unsigned hostPages) // IN: +{ + unsigned reservedPages; + +#if defined(__APPLE__) + /* + * Reserve (25% of the host memory + 512 MB) or 4 GB, whichever is lower. + * 4 GB hosts perform poorly with less than 1.5 GB reserved, and large + * memory hosts (>= 16 GB) may want to use more than 75% for VMs. + */ + reservedPages = MIN((hostPages / 4) + MBYTES_2_PAGES(512), + GBYTES_2_PAGES(4)); +#elif defined(_WIN32) + { + unsigned int hostGig = PAGES_2_GBYTES(hostPages); + + if (hostGig <= 4) { + reservedPages = hostPages / 4; + } else if (hostGig >= 16) { + reservedPages = hostPages / 8; + } else { + /* + * Increment by 1/32 for each 4GB of host mem between 4 and 16. + * See PR779556. + */ + reservedPages = hostPages / 32 * (8 - hostGig / 4); + } + } +#else // Linux + reservedPages = hostPages / 8; +#endif + + reservedPages = MAX(reservedPages, MEMDEFAULTS_MIN_HOST_PAGES); + + return hostPages > reservedPages ? hostPages - reservedPages : 0; +} + + +/* + *----------------------------------------------------------------------------- + * + * MemDefaults_CalcMaxLockedMBs -- + * + * Calculate the rough estimate of the maximum amount of memory + * that can be locked based on the size of host memory as supplied + * in MBytes. + * + * Results: + * The estimated maximum memory that can be locked in MBytes. + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint32 +MemDefaults_CalcMaxLockedMBs(uint32 hostMem) // IN: +{ + return PAGES_2_MBYTES( + MemDefaults_CalcMaxLockedPages(MBYTES_2_PAGES(hostMem))); +} + + +/* + *----------------------------------------------------------------------------- + * + * MemDefaults_CalcMinReservedMBs -- + * + * Provide a lower bound on the user as to the minimum amount + * of memory to lock based on the size of host memory. This + * threshold might be crossed as a result of the user limiting + * the amount of memory consumed by all VMs. + * + * Results: + * The minimum locked memory requirement in MBytes. + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint32 +MemDefaults_CalcMinReservedMBs(uint32 hostMem) // IN: +{ + if (hostMem < 512) { + return 32; + } else if (hostMem < 1024) { + return 64; + } else { + return 128; + } +} + + +void MemDefaults_GetReservedMemory(uint32 *host, uint32 *min, + uint32 *max, uint32 *recommended); + +#endif diff --git a/vmmon-only/include/modulecall.h b/vmmon-only/include/modulecall.h new file mode 100644 index 00000000..3f6f444b --- /dev/null +++ b/vmmon-only/include/modulecall.h @@ -0,0 +1,495 @@ +/********************************************************* + * Copyright (C) 1998-2015 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. 
+ * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + + +/* + * modulecall.h + * + * Monitor <--> Module (kernel driver) interface + */ + +#ifndef _MODULECALL_H +#define _MODULECALL_H + +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_VMMON +#include "includeCheck.h" + +#include "x86types.h" +#include "x86desc.h" +#include "ptsc.h" +#include "vcpuid.h" +#include "vcpuset.h" +#include "vmm_constants.h" +#include "contextinfo.h" +#include "rateconv.h" +#include "modulecallstructs.h" +#include "mon_assert.h" + +#define NUM_EXCEPTIONS 20 /* EXC_DE ... EXC_XF. */ + +#define MODULECALL_TABLE \ + MC(INTR) \ + MC(SEMAWAIT) \ + MC(SEMASIGNAL) \ + MC(SEMAFORCEWAKEUP) \ + MC(IPI) /* Hit thread with IPI. */ \ + MC(USERRETURN) /* Return codes for user calls. */ \ + MC(GET_RECYCLED_PAGES) \ + MC(RELEASE_ANON_PAGES) \ + MC(LOOKUP_MPN) \ + MC(COSCHED) \ + MC(ALLOC_VMX_PAGE) \ + MC(ALLOC_TMP_GDT) \ + MC(PIN_MPN) + +/* + *---------------------------------------------------------------------- + * + * ModuleCallType -- + * + * Enumeration of support calls done by the module. + * + * If anything changes in the enum, please update kstatModuleCallPtrs + * for stats purposes. + * + *---------------------------------------------------------------------- + */ + +typedef enum ModuleCallType { + MODULECALL_NONE = 100, +#define MC(_modulecall) MODULECALL_##_modulecall, + MODULECALL_TABLE +#undef MC + MODULECALL_LAST // Number of entries. Must be the last one +} ModuleCallType; + +#define MODULECALL_USERCALL_NONE 300 + +/* + * Define VMX86_UCCOST in the makefiles (Local.mk, + * typically) if you want a special build whose only purpose + * is to measure the overhead of a user call and its + * breakdown. + * + * WINDOWS NOTE: I don't know how to pass VMX86_UCCOST to + * the driver build on Windows. It must be defined by hand. + * + * ESX Note: we don't have a crosspage in which to store these + * timestamps. Such a feature would perhaps be nice (if we + * ever tire of the argument that esx does so few usercalls + * that speed doesn't matter). + */ + +#if defined(VMX86_UCCOST) && !defined(VMX86_SERVER) +#define UCTIMESTAMP(cp, stamp) \ + do { (cp)->ucTimeStamps[UCCOST_ ## stamp] = RDTSC(); } while (0) +#else +#define UCTIMESTAMP(cp, stamp) +#endif + +#ifdef VMX86_SERVER +typedef struct UCCostResults { + uint32 vmksti; + uint32 vmkcli; + uint32 ucnop; +} UCCostResults; +#else + +typedef struct UCCostResults { + uint32 htom; + uint32 mtoh; + uint32 ucnop; +} UCCostResults; + +typedef enum UCCostStamp { +#define UC(x) UCCOST_ ## x, +#include "uccostTable.h" + UCCOST_MAX +} UCCostStamp; +#endif // VMX86_SERVER + +/* + * Header for the wsBody64.S worldswitch code file. 
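+ *
+ * The hostToVmm and vmm64ToHost fields below are byte offsets from the
+ * start of this header, so (as a sketch, with 'ws' being a hypothetical
+ * WSModule pointer) the host-to-VMM entry point would be located as
+ *
+ *   uint8 *entry = (uint8 *)ws + ws->hostToVmm;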
+ */ +typedef struct WSModule { + uint32 vmmonVersion; // VMMON_VERSION when assembled as part of monitor + uint16 moduleSize; // size of whole wsBody64 module + uint16 hostToVmm; // offset from beginning of header to hostToVmm + uint16 vmm64ToHost; + uint16 _pad[3]; + + uint8 code[1024]; // big enough for MAX('.wsBody64', 'wsBody64Log') +} WSModule; + +typedef +#include "vmware_pack_begin.h" +struct SwitchNMIOffsets { + uint16 db; // offset to start of #DB handler + uint16 nmi; // offset to start of #NMI handler + uint16 df; // offset to start of #DF handler + uint16 ud; // offset to start of #UD handler + uint16 gp; // offset to start of #GP handler + uint16 pf; // offset to start of #PF handler + uint16 mce; // offset to start of #MCE handler +} +#include "vmware_pack_end.h" +SwitchNMIOffsets; + +/* + * This is a header for the switchNMI.S module. It contains code for + * exceptions occurring during worldswitch. The code gets copied to + * the crosspage by initialization. + */ +typedef +#include "vmware_pack_begin.h" +struct SwitchNMI { // see switchNMI.S + uint16 switchNMISize; + SwitchNMIOffsets host; // offsets to handlers + volatile Bool wsException[NUM_EXCEPTIONS]; // EXC_DE ... EXC_XF + // TRUE -> fault occurred in + // worldswitch + uint64 wsUD2; // IP of ud2 instruction + // 0ULL == unset + // other == worldswitch IP + uint8 codeBlock[768]; // Enough for + // max('.switchNMI', + // '.switchNMILog'). +} +#include "vmware_pack_end.h" +SwitchNMI; + +#define SHADOW_DR(cpData, n) (cpData)->shadowDR[n].ureg64 + + +/*---------------------------------------------------------------------- + * + * MAX_SWITCH_PT_PATCHES + * + * This is the maximum number of patches that must be placed into + * the monitor page tables so that two pages of the host GDT and the + * crosspage can be accessed during worldswitch. + * + *---------------------------------------------------------------------- + */ +#define MAX_SWITCH_PT_PATCHES 3 + +/*---------------------------------------------------------------------- + * + * WS_INTR_STRESS + * + * When set to non-zero, world switch code will enable single-step + * debugging across much of the switch path in both directions. The + * #DB handler detects single-stepping and induces a simulated NMI per + * instruction. This verifies that interrupts and exceptions are safe + * across the switch path, even if an NMI were raised during handling + * of another exception. + * + * When set to zero, normal worldswitch operation occurs. + * + * See the worldswitch assembly code for details. + * + *---------------------------------------------------------------------- + */ +#define WS_INTR_STRESS 0 + + +/*---------------------------------------------------------------------- + * + * VMM64PageTablePatch + * + * Describes an entry in the monitor page table which needs to be + * patched during the back-to-host worldswitch. + * + * o A patch can appear at any place in the page table, and so four + * items are required to uniquely describe the patch: + * + * o level + * + * This is the level in the page table to which the patch must + * be applied: L4, L3, L2, L1. This information is used to + * determine the base of the region of memory which must be + * patched. The level value corresponds to the following + * regions in monitor memory: + * + * MMU_ROOT_64 + * MMU_L3_64 + * MMU_L2_64 + * MON_PAGE_TABLE_64 + * + * The value zero is reserved to indicate an empty spot in the + * array of patches. 
+ * + * o level offset + * + * The monitor memory regions corresponding to the page table + * levels may be more than one page in length, so a 'page + * offset' is required to know the starting address of the page + * table page which must be patched in 'level'. + * + * o page index + * + * The 'index' value specifies the element in the page which + * should be patched. + * + * o pte + * + * This is the PTE value which will be patched into the monitor + * page table. + * + *---------------------------------------------------------------------- + */ +typedef +#include "vmware_pack_begin.h" +struct VMM64PageTablePatch { +#define PTP_EMPTY (0U) /* Unused array entry. (must be 0) */ +#define PTP_LEVEL_L1 (1U) /* leaf level */ +#define PTP_LEVEL_L2 (2U) +#define PTP_LEVEL_L3 (3U) +#define PTP_LEVEL_L4 (4U) /* root level */ + uint16 level; /* [0, 4] (maximal size: 3 bits) */ + uint16 page; /* Index of 'page' in 'level'. */ + uint32 index; /* Index of 'pte' in 'page'. */ + VM_PDPTE pte; /* PTE. */ +} +#include "vmware_pack_end.h" +VMM64PageTablePatch; + +#define MODULECALL_NUM_ARGS 4 + +/* + *---------------------------------------------------------------------- + * + * VMCrossPageData -- + * + * Data which is stored on the VMCrossPage. + * + *---------------------------------------------------------------------- + */ +typedef +#include "vmware_pack_begin.h" +struct VMCrossPageData { + /* + * A tiny stack upon which interrupt and exception handlers in the switch + * path temporarily run. Keep the end 16-byte aligned. This stack must + * be large enough for the sum of: + * + * - 1 #DB exception frame (5 * uint64) + * - 1 #NMI exception frame (5 * uint64) + * - 1 #MCE exception frame (5 * uint64) + * - the largest stack use instantaneously possible by #MCE handling code + * - the largest stack use instantaneously possible by #NMI handling code + * - the largest stack use instantaneously possible by #DB handling code + * - one high-water uint32 used to detect stack overflows when debugging + * - remaining pad bytes to align to 16 bytes + * + * 184 bytes is slightly more than enough as of 2015/03/17 -- fjacobs. + */ + uint32 tinyStack[46]; + + uint64 hostCR3; + uint32 crosspageMA; + + uint8 hostDRSaved; // Host DR spilled to hostDR[x]. + uint8 hostDRInHW; // 0 -> shadowDR in h/w, 1 -> hostDR in h/w. + // contains host-sized DB,NMI,MCE entries + uint16 hostSS; + uint64 hostRSP; + uint64 hostDR[8]; + uint64 hostRBX; + uint64 hostRSI; + uint64 hostRDI; + uint64 hostRBP; + uint64 hostR12; + uint64 hostR13; + uint64 hostR14; + uint64 hostR15; + LA64 hostCrossPageLA; // where host has crosspage mapped + uint16 hostInitial64CS; + uint16 _pad0[3]; + + uint64 wsCR0; + uint64 wsCR4; + + DTR64 crossGDTHKLADesc; // always uses host kernel linear address + uint16 _pad1[3]; + DTR64 mon64GDTR; + uint16 mon64ES; + uint16 mon64SS; + uint16 mon64DS; + uint64 mon64CR3; + uint64 mon64RBX; + uint64 mon64RSP; + uint64 mon64RBP; + uint64 mon64RSI; + uint64 mon64RDI; + uint64 mon64R12; + uint64 mon64R13; + uint64 mon64R14; + uint64 mon64R15; + uint64 mon64RIP; + Task64 monTask64; /* vmm64's task */ + + VMM64PageTablePatch vmm64PTP[MAX_SWITCH_PT_PATCHES]; /* page table patch */ + LA64 vmm64CrossPageLA; + LA64 vmm64CrossGDTLA; // where crossGDT mapped by PT patch + // 64-bit host: host kernel linear + // address + + /* + * The monitor may requests up to two actions when returning to the + * host. The moduleCallType field and args encode a request for + * some action in the driver. 
The userCallType field (together + * with the RPC block) encodes a user call request. The two + * requests are independent. The user call is executed first, with + * the exception of MODULECALL_INTR which has a special effect. + */ + ModuleCallType moduleCallType; + uint32 retval; + uint64 args[MODULECALL_NUM_ARGS]; + int userCallType; + uint32 pcpuNum; /* Used as extra module call arg within vmmon. */ + + VCPUSet yieldVCPUs; + +#if !defined(VMX86_SERVER) + uint64 ucTimeStamps[UCCOST_MAX]; +#endif + + /* + * The values in the shadow debug registers must match those in the + * hardware debug register immediately after a task switch in + * either direction. They are used to minimize moves to and from + * the debug registers. + */ + SharedUReg64 shadowDR[8]; + uint8 shadowDRInHW; // bit n set iff %DRn == shadowDR[n] + + SwitchedMSRState switchedMSRState; + uint8 _pad2[7]; + + /* + * Adjustment for machines where the hardware TSC does not run + * constantly (laptops) or is out of sync between different PCPUs. + * Updated as needed by vmmon. See VMK_SharedData for the ESX + * analog, which is updated by the vmkernel. + */ + RateConv_ParamsVolatile pseudoTSCConv; + VmAbsoluteTS worldSwitchPTSC; // PTSC value immediately before + // last worldswitch. + + VmAbsoluteTS timerIntrTS; // PTSC of timer interrupt while in the vmm + VmAbsoluteTS hstTimerExpiry; // PTSC of host timer interrupt + VmAbsoluteTS monTimerExpiry; // PTSC of next MonTimer callback + + Bool activateVMX; // TRUE -> activate Intel VMX extensions + Bool activateSVM; // TRUE -> activate AMD SVM extensions + Bool retryWorldSwitch; // TRUE -> return to host on host->vmm switch + /* + * TRUE if moduleCall was interrupted by signal. Only + * vmmon uses this field to remember that it should + * restart RunVM call, nobody else should look at it. + */ + Bool moduleCallInterrupted; + uint8 _pad3[4]; + + DTR64 switchHostIDTR; // baseLA = switchHostIDT's host knl LA + uint16 _pad4[3]; + DTR64 switchMon64IDTR; // has baseLA = switchMon64IDT's monitor LA + // contains 64-bit DB,NMI,MCE entries + uint16 _pad5[3]; + + /* + * Descriptors and interrupt tables for switchNMI handlers. Each + * IDT has only enough space for the hardware exceptions; they are + * sized to accommodate 64-bit descriptors. + */ + uint8 switchHostIDT [sizeof(Gate64) * NUM_EXCEPTIONS]; // hostCS:hostVA + uint8 switchMon64IDT[sizeof(Gate64) * NUM_EXCEPTIONS]; // 64-bit monCS:monVA +} +#include "vmware_pack_end.h" +VMCrossPageData; + +/* + *---------------------------------------------------------------------- + * + * VMCrossPageCode -- + * + * Code which is stored on the VMCrossPage. + * + *---------------------------------------------------------------------- + */ +typedef +#include "vmware_pack_begin.h" +struct VMCrossPageCode { + WSModule worldswitch; + SwitchNMI faultHandler; +} +#include "vmware_pack_end.h" +VMCrossPageCode; + + +/* + *---------------------------------------------------------------------- + * + * VMCrossPage -- + * + * Data structure shared between the monitor and the module + * that is used for crossing between the two. + * Accessible as vm->cross (kernel module) and CROSS_PAGE + * (monitor) + * + * Exactly one page long + * + *---------------------------------------------------------------------- + */ + +typedef +#include "vmware_pack_begin.h" +struct VMCrossPage { + uint32 version; /* 4 bytes. Must be at offset zero. */ + uint32 crosspage_size; /* 4 bytes. Must be at offset 4. 
*/ + VMCrossPageData crosspageData; + uint8 _pad[PAGE_SIZE - (sizeof(uint32) /* version */ + + sizeof(uint32) /* crosspage_size */ + + sizeof(VMCrossPageData) + + sizeof(VMCrossPageCode))]; + VMCrossPageCode crosspageCode; +} +#include "vmware_pack_end.h" +VMCrossPage; + +#define CROSSPAGE_VERSION_BASE 0xbf1 /* increment by 1 */ +#define CROSSPAGE_VERSION ((CROSSPAGE_VERSION_BASE << 1) + WS_INTR_STRESS) + +#if !defined(VMX86_SERVER) && defined(VMM) +#define CROSS_PAGE ((VMCrossPage * const) VPN_2_VA(CROSS_PAGE_START)) +#define VMM_SWITCH_SHARED_DATA ((VMCrossPageData *)&CROSS_PAGE->crosspageData) +#endif + +#define NULLPAGE_LINEAR_START (MONITOR_LINEAR_START + \ + PAGE_SIZE * CPL0_GUARD_PAGE_START) + +#define MX_WAITINTERRUPTED 3 +#define MX_WAITTIMEDOUT 2 +#define MX_WAITNORMAL 1 // Must equal one; see linux module code. +#define MX_WAITERROR 0 // Use MX_ISWAITERROR() to test for error. + +// Any zero or negative value denotes error. +#define MX_ISWAITERROR(e) ((e) <= MX_WAITERROR) +#endif diff --git a/vmmon-only/include/modulecallstructs.h b/vmmon-only/include/modulecallstructs.h new file mode 100644 index 00000000..7943a2ba --- /dev/null +++ b/vmmon-only/include/modulecallstructs.h @@ -0,0 +1,99 @@ +/********************************************************* + * Copyright (C) 2006,2009-2011,2013-2014 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * modulecallstructs.h -- + * + * + * Data structures that need to be included in modulecall.h + * as well as the vmkernel. + * + */ + +#ifndef _MODULECALLSTRUCTS_H_ +#define _MODULECALLSTRUCTS_H_ + +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_VMCORE + +#include "includeCheck.h" + +#include "vm_basic_types.h" + +/* + * Flags indicating switched MSR status. + * + * UNUSED - Not used by the monitor (yet). [This is a value, not a flag.] + * USED - Hardware MSR is used by the monitor. + * RESTORED - Monitor value is restored on world switch into the VMM. + * SHADOWED - Live monitor value is always shadowed in the SwitchedMSRState. + * + */ + +#define SWITCHED_MSR_FLAG_UNUSED 0 +#define SWITCHED_MSR_FLAG_USED 1 +#define SWITCHED_MSR_FLAG_RESTORED 2 +#define SWITCHED_MSR_FLAG_SHADOWED 4 + +/* + * Note: If you add an msr to this list, please also ensure that + * hardware support for the msr is properly indicated in + * both the monitor (MonMSRIsSupported) and in the vmkernel + * (world switch msrSupported array). + */ +#define SWITCHED_MSRS \ + SWMSR(MSR_SYSENTER_CS) \ + SWMSR(MSR_SYSENTER_EIP) \ + SWMSR(MSR_SYSENTER_ESP) \ + SWMSR(MSR_STAR) \ + SWMSR(MSR_LSTAR) \ + SWMSR(MSR_CSTAR) \ + SWMSR(MSR_SFMASK) \ + SWMSR(MSR_TSC_AUX) \ + SWMSR(MSR_BD_TSC_RATIO) + +/* + * Data structures for dealing with the context-switched MSRs that need + * to be specially handled. 
While the MSR definitions themselves + * are part of the x86 architecture, our handling of them (and hence + * these data structures) is an implementation detail. + */ + + +typedef enum SwitchedMSR { +#define SWMSR(msr) SWITCHED_##msr, + SWITCHED_MSRS +#undef SWMSR + NUM_SWITCHED_MSRS +} SwitchedMSR; + +/* + * Switched MSR values for each [vp]CPU. + */ +typedef struct SwitchedMSRValues { + uint64 a[NUM_SWITCHED_MSRS]; +} SwitchedMSRValues; + +typedef struct SwitchedMSRState { + SwitchedMSRValues smv; + uint8 flags[NUM_SWITCHED_MSRS]; + uint32 _pad; +} SwitchedMSRState; + +#endif diff --git a/vmmon-only/include/mon_assert.h b/vmmon-only/include/mon_assert.h new file mode 100644 index 00000000..b86832ca --- /dev/null +++ b/vmmon-only/include/mon_assert.h @@ -0,0 +1,207 @@ +/********************************************************* + * Copyright (C) 2007-2014 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef _MON_ASSERT_H_ +#define _MON_ASSERT_H_ + +#define INCLUDE_ALLOW_USERLEVEL + +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMCORE +#include "includeCheck.h" + +#include "vm_assert.h" +#include "vm_basic_asm.h" + +/* + * Monitor Source Location + * + * The monitor encodes source locations -- file name & line number -- + * in just 32 bits; the process is arcane enough that it deserves a + * little discussion. + * + * o The ASSERT family of macros are expanded in the monitor to take + * an 'Assert_MonSrcLoc' rather than the standard ', + * ' couplet. + * + * o The ', ' couplet is encoded into + * Assert_MonSrcLoc, which is an unsigned 32-bit integer. + * + * o The upper 16-bits of Assert_MonSrcLoc are the line number. + * + * Source lines above 65535 will be silently masked to 16-bits. + * + * o The lower 16-bits of Assert_MonSrcLoc are the offset to the file + * name from the start of the file name table. + * + * This, of course, implies that the size of the table containing + * the file names cannot exceed 64K. + * + * o If we use '__FILE__' directly, gcc will coalesce all equivalent + * strings into a single occurrence (in '.rodata'). + * + * Using the full pathname for __FILE__ is undesirable because + * different source trees frequently have different path name + * lengths, and this causes the 'monitor-modular-size' script to + * report differences in '.rodata'. + * + * o To avoid differences in '.rodata', each __FILE__ is put into + * its own section. The monitor's linker (not ld) will use the + * name of the section to recover the name of the source file. + * + * o At run time, prior to loading, when our linker is creating an + * executable image of the monitor and extensions, all the file + * names are extracted from these sections, the '${VMTREE}' prefix + * is removed, and the resulting table of shortened file names is + * added to '.rodata'. 
+ * + * Further, during linkage, each relocation to the original + * section containing the path name is modified so that the low + * 16-bits contain an offset from '__vmm_pathnames_start' rather + * than the base of the original containing section. + * + * Only three types of relocations to the assertion strings are + * supported (32-bit PC-relative and 32-bit/64-bit absolute) because that + * is all the compiler has been seen to generate. + */ + +#define ALL_ASSERT_TYPES \ + ADEF(AssertType_AssertPanic, _AssertPanicFmt), \ + ADEF(AssertType_AssertAssert, _AssertAssertFmt), \ + ADEF(AssertType_AssertVerify, _AssertVerifyFmt), \ + ADEF(AssertType_AssertNotImplemented, _AssertNotImplementedFmt), \ + ADEF(AssertType_AssertNotReached, _AssertNotReachedFmt), \ + ADEF(AssertType_AssertPanicBug, _AssertPanicFmt " bugNr=%d"), \ + ADEF(AssertType_AssertAssertBug, _AssertAssertFmt " bugNr=%d"), \ + ADEF(AssertType_AssertVerifyBug, _AssertVerifyFmt " bugNr=%d"), \ + ADEF(AssertType_AssertNotImplementedBug, \ + _AssertNotImplementedFmt " bugNr=%d"), \ + ADEF(AssertType_AssertNotReachedBug, _AssertNotReachedFmt " bugNr=%d"),\ + ADEF(AssertType_AssertNotTested, _AssertNotTestedFmt) + +typedef uint32 Assert_MonSrcLoc; + +#define ADEF(type, fmt) type +typedef enum Assert_Type { + ALL_ASSERT_TYPES +} Assert_Type; +#undef ADEF + +typedef struct Assert_Info { + VA faultAddr; + struct { + Assert_Type type:4; + int bugNr:28; + } misc; + Assert_MonSrcLoc loc; +} Assert_Info; + +/* + * The portion of the __attribute__ line after __FILE__ is there so that + * the .assert_pathname_* sections are not marked as ALLOC, since we only + * need them in the vmx and do not need them loaded. + */ +#define __VMM__FILE__SECTION \ + __attribute__((section (".assert_pathname_" __FILE__ ",\"\"#"))) +#define __VMM__FILE__ ({ \ + static __VMM__FILE__SECTION const char file[] = ""; \ + file; \ + }) + +#define ASSERT_MONSRCFILEOFFSET(loc) LOWORD(loc) +#define ASSERT_MONSRCLINE(loc) HIWORD(loc) + +#define ASSERT_NULL_MONSRCLOC 0 // there is never line 0 + +#ifdef VMM // { +#ifdef MONITOR_APP // { + +#define ASSERT_MONSRCLOC() ASSERT_NULL_MONSRCLOC + +#else // } { + +#define ASSERT_MONSRCLOC() ({ \ + const uintptr_t offset = ((__LINE__ << 16) + \ + (uintptr_t)__VMM__FILE__); \ + const Assert_MonSrcLoc loc = offset; \ + loc; \ +}) + +extern const char __vmm_pathnames_start; +#define ASSERT_MONSRCFILE(loc) \ + (&__vmm_pathnames_start + ASSERT_MONSRCFILEOFFSET(loc)) + + +/* + * Assertion information is collected in a non-loadable section + * named .assert_info. Each record in this section contains + * a VMM address, an assertion type, an optional bug number, and + * the MonSrcLoc described previously. The VMM address is a key + * used by the VMX to look up the information associated with + * a particular assertion failure. + * + * Assertion failures are fired by executing a ud2 instruction. + * + * For assertions which always result in a terminal user RPC, we use + * __builtin_trap to generate the ud2, so that gcc knows that the + * subsequent code is unreachable. For assertions which are + * recoverable (e.g any assertion triggered on the BackToHost path), + * we generate the ud2 manually, so that gcc will treat the subsequent + * code as reachable. + * + * The memory barriers work around a gcc bug that results from having + * to continue past an assertion. 
Without these barriers, gcc has been + * seen to hoist code into the failing arm of the assertion, where it + * can then tell that, because of the assertion failure, the code ends + * up accessing an array out of bounds. + */ + +#define ASSERT_RECORDINFO(assembly, assertType, bugNr) \ + __asm__ __volatile__(".pushsection .assert_info;" \ + ".quad 0f;" \ + ".long %c[type] + (%c[bug] << 4);" \ + ".long (%c[line] << 16) + %c[file];" \ + ".popsection;" \ + "0: " assembly : : \ + [line] "i" (__LINE__), \ + [file] "i" (__VMM__FILE__), \ + [type] "i" (assertType), \ + [bug] "i" (bugNr)) + +#define _ASSERT_PANIC(name) \ + ({COMPILER_MEM_BARRIER(); \ + ASSERT_RECORDINFO("ud2", AssertType_##name, 0);}) + +#define _ASSERT_PANIC_NORETURN(name) \ + ({COMPILER_MEM_BARRIER(); \ + ASSERT_RECORDINFO("", AssertType_##name, 0); \ + __builtin_trap();}) + +#define _ASSERT_PANIC_BUG(bug, name) \ + ({COMPILER_MEM_BARRIER(); \ + ASSERT_RECORDINFO("ud2", AssertType_##name##Bug, bug);}) + +#define _ASSERT_PANIC_BUG_NORETURN(bug, name) \ + ({COMPILER_MEM_BARRIER(); \ + ASSERT_RECORDINFO("", AssertType_##name##Bug, bug); \ + __builtin_trap();}) + +#endif // MONITOR_APP } +#endif // VMM } + +#endif diff --git a/vmmon-only/include/monitorAction_exported.h b/vmmon-only/include/monitorAction_exported.h new file mode 100644 index 00000000..28b57c2c --- /dev/null +++ b/vmmon-only/include/monitorAction_exported.h @@ -0,0 +1,156 @@ +/********************************************************* + * Copyright (C) 2010-2013 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef _MONITORACTION_EXPORTED_H_ +#define _MONITORACTION_EXPORTED_H_ + +#define INCLUDE_ALLOW_VMX +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_USERLEVEL +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_DISTRIBUTE +#include "includeCheck.h" + +#include "vm_assert.h" +#include "vm_atomic.h" +#include "vm_basic_types.h" + +/* + * Please bump the version number if your change will break the + * compatability to the drivers. + */ +#define ACTION_EXPORTED_VERSION 2 + +#define ACTION_WORD_SIZE (sizeof(uint64) * 8) +#define ACTION_NUM_WORDS (2) +#define ACTION_NUM_IDS (ACTION_NUM_WORDS * ACTION_WORD_SIZE) + +#define MONACTION_INVALID MAX_UINT32 + +typedef uint32 MonitorIdemAction; + +/* + * Representation of a set of actions. + */ +typedef struct MonitorActionSet { + volatile uint64 word[ACTION_NUM_WORDS]; +} MonitorActionSet; + +#ifndef __cplusplus +typedef enum MonitorActionSetName MonitorActionSetName; +#endif + +/* + * Summary of action and interrupt states. 
+ */ +typedef struct MonitorActionIntr { + MonitorActionSet pendingSet; + volatile Bool action; + Bool intr; + Bool nmi; + Bool db; + uint32 _pad; +} MonitorActionIntr; + +/* + *------------------------------------------------------------------------ + * MonitorActionSet_AtomicInclude -- + * + * This function atomically adds an action to an action set. + * + * Results: + * TRUE if the action being added did not exist in the action set. + * FALSE otherwise. + * + * Side effects: + * The given action set will be updated. + *------------------------------------------------------------------------ + */ +static INLINE Bool +MonitorActionSet_AtomicInclude(MonitorActionSet *set, const uint32 actionID) +{ + Atomic_uint64 *atomicSet = + Atomic_VolatileToAtomic64(&set->word[actionID / ACTION_WORD_SIZE]); + uint64 mask = (uint64)1 << (actionID % ACTION_WORD_SIZE); + uint64 oldWord; + uint64 newWord; + + ASSERT_ON_COMPILE((ACTION_WORD_SIZE & (ACTION_WORD_SIZE - 1)) == 0); +#ifdef VMX86_DEBUG + /* If ASSERT is not desirable, do explicit check. Please see PR 567811. */ +#ifdef MODULE + if (UNLIKELY(actionID / ACTION_WORD_SIZE >= ACTION_NUM_WORDS)) { + return FALSE; + } +#else + ASSERT(actionID / ACTION_WORD_SIZE < ACTION_NUM_WORDS); +#endif // MODULE +#endif // VMX86_DEBUG + do { + oldWord = Atomic_Read64(atomicSet); + newWord = oldWord | mask; + } while (!Atomic_CMPXCHG64(atomicSet, &oldWord, &newWord)); + return (oldWord & mask) == 0; +} + + +/* + *---------------------------------------------------------------------------- + * MonitorAction_SetBits -- + * + * The core logic for posting an action. Update the set of pending + * actions of the target VCPU in the shared area to mark the action + * as present. Make sure the bit is set in the pendingSet first to + * avoid a race with the drain loop. + * + * It's the responsibility of the callers to ensure that the change + * to actionIntr->action is globally visible before any IPI is sent + * (the change to pendingSet is pushed out by the cmpxchg in + * MonitorActionSet_AtomicInclude). + * + * Results: + * TRUE if the action being posted was not pending before. + * FALSE otherwise (other threads could have posted the same action). + * + * Side effects: + * None. + *---------------------------------------------------------------------------- + */ +static INLINE Bool +MonitorAction_SetBits(MonitorActionIntr *actionIntr, MonitorIdemAction actionID) +{ + /* Careful if optimizing this: see PR70016. */ + Bool newAction = + MonitorActionSet_AtomicInclude(&actionIntr->pendingSet, actionID); + actionIntr->action = TRUE; + return newAction; +} + +/* + * C1 states entered by monitor while waiting for an action + */ +typedef enum { + VMM_C1_STATE_INVALID = 0, + VMM_C1_STATE_HLT, + VMM_C1_STATE_MWAIT, + VMM_C1_STATE_PAUSE +} vmmC1StateType; + +#endif // _MONITORACTION_EXPORTED_H_ diff --git a/vmmon-only/include/numa_defs.h b/vmmon-only/include/numa_defs.h new file mode 100644 index 00000000..f14a8b54 --- /dev/null +++ b/vmmon-only/include/numa_defs.h @@ -0,0 +1,72 @@ +/********************************************************* + * Copyright (C) 2006 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. 
+ * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * numa_defs.h -- + * This is the internal header file for the NUMA module. + */ + +#ifndef _NUMA_DEFS_H +#define _NUMA_DEFS_H + +#define INCLUDE_ALLOW_VMX +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_VMMON + +#define INCLUDE_ALLOW_USERLEVEL +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_VMKERNEL + +#include "includeCheck.h" +#include "vm_basic_types.h" +#include "vm_basic_defs.h" +#include "cpu_defs.h" + +/* Machine NUMA nodes */ +typedef uint32 NUMA_Node; +typedef uint32 NUMA_NodeMask; +typedef uint8 NUMA_MemRangeID; + +/* + * Constants + */ +#define NUMA_MAX_NODES 32 +#define NUMA_MAX_CPUS_PER_NODE (vmx86_server ? MAX_PCPUS : 32) +#define NUMA_MAX_MEM_RANGES 64 +#define INVALID_NUMANODE ((NUMA_Node)-1) +#define NUMA_NODE_MASK_ANY ((NUMA_NodeMask)-1) +#define NUMA_NODE_MASK_NONE ((NUMA_NodeMask)0) + + +/* + * Structures + */ +typedef struct { + MPN startMPN; + MPN endMPN; + NUMA_Node id; + Bool isReliable; + Bool isVolatile; +} NUMA_MemRange; + +typedef struct NUMA_MemRangesList { + uint64 numMemRanges; + NUMA_MemRange memRange[NUMA_MAX_MEM_RANGES]; +} NUMA_MemRangesList; + +#endif // _NUMA_DEFS_H diff --git a/vmmon-only/include/overheadmem_types.h b/vmmon-only/include/overheadmem_types.h new file mode 100644 index 00000000..a07bcab6 --- /dev/null +++ b/vmmon-only/include/overheadmem_types.h @@ -0,0 +1,131 @@ +/********************************************************* + * Copyright (C) 2001-2013 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * overheadmem_types.h + * + * Types for tracking memory overheads. + */ + +#ifndef _OVERHEADMEM_TYPES_H +#define _OVERHEADMEM_TYPES_H + +#define INCLUDE_ALLOW_USERLEVEL + +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_MODULE +#include "includeCheck.h" + +#include "vm_basic_types.h" + +/* + * There are 4 types of memory we lock on the host. Memory can be Mem_Mapped in + * the vmx, anonymous memory for use by monitor is not mapped permanently in any + * address space, guest memory regions other than main memory (can be + * locked/unlocked on hosted but not on ESX), and main memory which can be + * locked/unlocked in hosted and esx. + * + * In addition, the vmx may malloc memory or declare (large) static structures. 
+ * Neither of these is locked on hosted platforms and the hostOS may swap it. + * Therefore, on hosted platforms we do not track this memory and instead + * include a working set component (sched.mem.hosted.perVMOverheadMBs). + * On ESX, this memory must be accounted for so we account it to user + * (nonpaged) overhead. At present, the accounting is extremely coarse, + * and only aggregate sizes are hard-coded (see PR363997). + */ +typedef enum OvhdMemType { + OvhdMem_memmap, + OvhdMem_anon, + OvhdMem_guest, + OvhdMem_mainmem, + OvhdMem_malloc, + OvhdMem_static, + OvhdMem_text, + NumOvhdMemTypes +} OvhdMemType; + +#define OvhdMemMask(type) (1 << type) + +#define OVHDMEM_NONE 0x0 +#define OVHDMEM_MEMMAP 0x1 // OvhdMemMask(OvhdMem_memmap) +#define OVHDMEM_ANON 0x2 // OvhdMemMask(OvhdMem_anon) +#define OVHDMEM_GUEST 0x4 // OvhdMemMask(OvhdMem_guest) +#define OVHDMEM_MAINMEM 0x8 // OvhdMemMask(OvhdMem_mainmem) +#define OVHDMEM_MALLOC 0x10 // OvhdMemMask(OvhdMem_malloc) +#define OVHDMEM_STATIC 0x20 // OvhdMemMask(OvhdMem_static) +#define OVHDMEM_TEXT 0x40 // OvhdMemMask(OvhdMem_text) +#define OVHDMEM_ALL_USER (OVHDMEM_MEMMAP | OVHDMEM_GUEST | OVHDMEM_MAINMEM | \ + OVHDMEM_MALLOC | OVHDMEM_STATIC | OVHDMEM_TEXT) +#define OVHDMEM_ALL (OVHDMEM_ALL_USER | OVHDMEM_ANON) + +/* ... and four categories of memory sources. */ +typedef enum OvhdMemCategory { + OvhdMemCat_paged, + OvhdMemCat_nonpaged, + OvhdMemCat_excluded, + OvhdMemCat_anonymous, + NumOvhdMemCategories +} OvhdMemCategory; + +#define OVHDMEM_PAGED (OVHDMEM_MALLOC | OVHDMEM_STATIC) +#define OVHDMEM_NONPAGED (OVHDMEM_GUEST | OVHDMEM_MEMMAP) +#define OVHDMEM_EXCLUDED (OVHDMEM_MAINMEM | OVHDMEM_TEXT) + +#if ((OVHDMEM_PAGED & OVHDMEM_NONPAGED) != 0) || \ + ((OVHDMEM_NONPAGED & OVHDMEM_EXCLUDED) != 0) || \ + ((OVHDMEM_PAGED & OVHDMEM_EXCLUDED) != 0) || \ + ((OVHDMEM_PAGED | OVHDMEM_NONPAGED | OVHDMEM_EXCLUDED | OVHDMEM_ANON) != \ + OVHDMEM_ALL) +#error Overheadmem categories do not form a partition of the overheads +#endif + +/* Categories of overhead for 32-bit and 64-bit mode. */ +typedef struct OvhdMem_Overheads { + uint32 paged; + uint32 nonpaged; + uint32 anonymous; + uint32 text; +} OvhdMem_Overheads; + +typedef struct OvhdMem_Deltas { + int32 paged; + int32 nonpaged; + int32 anonymous; +} OvhdMem_Deltas; + + +/* Types for tracking vmx (user) overheads. */ + +#define OVHDMEM_MAX_NAME_LEN 36 + +/* Types for tracking vmm overheads. */ + +typedef struct OvhdMemUsage { + uint32 reserved; // pages + uint32 used; // pages +} OvhdMemUsage; + +typedef struct OvhdMemNode { + OvhdMemUsage usage; // allocated and rsvd bytes for source + OvhdMemUsage maxUsage; // max allocated and rsvd bytes for source + char name[OVHDMEM_MAX_NAME_LEN]; // name of overhead source + OvhdMemType type; // how/where memory for source is managed +} OvhdMemNode; + +#endif diff --git a/vmmon-only/include/pageLock_defs.h b/vmmon-only/include/pageLock_defs.h new file mode 100644 index 00000000..c3b5eb98 --- /dev/null +++ b/vmmon-only/include/pageLock_defs.h @@ -0,0 +1,105 @@ +/********************************************************* + * Copyright (C) 2015 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. 
+ * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + + +/* + * pageLock_defs.h + * + * Page lock status codes, used by vmmon. + */ + +#ifndef _PAGELOCK_DEFS_H_ +#define _PAGELOCK_DEFS_H_ + +#define INCLUDE_ALLOW_USERLEVEL +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_MODULE +#include "includeCheck.h" + +/* + * Return codes from page locking, unlocking, and MPN lookup. + * They share an error code space because they call one another + * internally. + * + * PAGE_LOCK_FAILED The host refused to lock a page. + * PAGE_LOCK_LIMIT_EXCEEDED We have reached the limit of locked + * pages for all VMs + * PAGE_LOCK_TOUCH_FAILED Failed to touch page after lock. + * PAGE_LOCK_IN_TRANSITION The page is locked but marked by Windows + * as nonpresent in CPU PTE and in transition + * in Windows PFN. + * + * PAGE_LOCK_SYS_ERROR System call error. + * PAGE_LOCK_ALREADY_LOCKED Page already locked. + * PAGE_LOCK_MEMTRACKER_ERROR MemTracker fails. + * PAGE_LOCK_PHYSTRACKER_ERROR PhysTracker fails. + * PAGE_LOCK_MDL_ERROR Mdl error on Windows. + * + * PAGE_UNLOCK_NO_ERROR Unlock successful (must be 0). + * PAGE_UNLOCK_NOT_TRACKED Not in memtracker. + * PAGE_UNLOCK_NO_MPN Tracked but no MPN. + * PAGE_UNLOCK_NOT_LOCKED Not locked. + * PAGE_UNLOCK_TOUCH_FAILED Failed to touch page. + * PAGE_UNLOCK_MISMATCHED_TYPE Tracked but was locked by different API + * + * PAGE_LOOKUP_INVALID_ADDR Consistency checking. + * PAGE_LOOKUP_BAD_HIGH_ADDR Consistency checking. + * PAGE_LOOKUP_ZERO_ADDR Consistency checking. + * PAGE_LOOKUP_SMALL_ADDR Consistency checking. + * + * All error values must be negative values less than -4096 to avoid + * conflicts with errno values on Linux. 
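+ *
+ * A caller that only needs to distinguish transient ("soft") lock
+ * failures from hard errors might, for example, test the status with
+ * the PAGE_LOCK_SOFT_FAILURE() macro defined at the end of this file:
+ *
+ *   if (PAGE_LOCK_SOFT_FAILURE(status)) {
+ *      // e.g. PAGE_LOCK_LIMIT_EXCEEDED; possibly worth retrying later
+ *   }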
+ * + * -- edward + */ + +#define PAGE_LOCK_SUCCESS 0 +#define PAGE_LOCK_FAILED (-10001) +#define PAGE_LOCK_LIMIT_EXCEEDED (-10002) +#define PAGE_LOCK_TOUCH_FAILED (-10003) +#define PAGE_LOCK_IN_TRANSITION (-10004) + +#define PAGE_LOCK_SYS_ERROR (-10010) +#define PAGE_LOCK_ALREADY_LOCKED (-10011) +#define PAGE_LOCK_MEMTRACKER_ERROR (-10012) +#define PAGE_LOCK_PHYSTRACKER_ERROR (-10013) +#define PAGE_LOCK_MDL_ERROR (-10014) + +#define PAGE_UNLOCK_SUCCESS 0 +#define PAGE_UNLOCK_NOT_TRACKED (-10100) +#define PAGE_UNLOCK_NO_MPN (-10101) +#define PAGE_UNLOCK_NOT_LOCKED (-10102) +#define PAGE_UNLOCK_TOUCH_FAILED (-10103) +#define PAGE_UNLOCK_MISMATCHED_TYPE (-10104) + +#define PAGE_LOOKUP_SUCCESS 0 +#define PAGE_LOOKUP_INVALID_ADDR (-10200) +#define PAGE_LOOKUP_BAD_HIGH_ADDR (-10201) +#define PAGE_LOOKUP_ZERO_ADDR (-10202) +#define PAGE_LOOKUP_SMALL_ADDR (-10203) +#define PAGE_LOOKUP_SYS_ERROR (-10204) +#define PAGE_LOOKUP_NOT_TRACKED (-10) // added to another code +#define PAGE_LOOKUP_NO_MPN (-20) // added to another code +#define PAGE_LOOKUP_NOT_LOCKED (-30) // added to another code +#define PAGE_LOOKUP_NO_VM (-40) // added to another code + +#define PAGE_LOCK_SOFT_FAILURE(status) (status <= PAGE_LOCK_FAILED && \ + status > PAGE_LOCK_SYS_ERROR) + +#endif // ifndef _PAGELOCK_DEFS_H_ diff --git a/vmmon-only/include/pagelist.h b/vmmon-only/include/pagelist.h new file mode 100644 index 00000000..46ed1424 --- /dev/null +++ b/vmmon-only/include/pagelist.h @@ -0,0 +1,101 @@ +/********************************************************* + * Copyright (C) 2010-2014 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * pagelist.h -- + * + * Definitions of operations on BPNs used in communicating page info + * between VMKernel/VMX and VMM. + */ + +#ifndef _PAGELIST_H +#define _PAGELIST_H + +#define INCLUDE_ALLOW_USERLEVEL +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_MODULE +#include "includeCheck.h" + +#include "vm_assert.h" +#include "vmcore_types.h" + +/* + * Sets of pages are passed between the monitor and the platform to be + * shared, invalidated, remapped, or swapped. + * + * A set is sized so that it fits in a 4KB page. 
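+ *
+ * As a usage sketch (pageList, i and bpn being hypothetical locals), a
+ * producer might build entries with the helpers defined below and void
+ * any entry whose BPN already appears earlier in the list:
+ *
+ *   pageList[i] = PageList_CreateEntry(bpn);
+ *   if (PageList_IsBPNDup(pageList, i, bpn)) {
+ *      PageList_VoidEntry(&pageList[i]);
+ *   }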
+ */ + +#pragma pack(push, 1) +typedef struct PageListEntry { + CompressedBPN cbpn; + Bool voided; + uint8 _pad[2]; +} PageListEntry; +#pragma pack(pop) + +#define PAGELIST_MAX (PAGE_SIZE / sizeof(PageListEntry)) + +static INLINE PageListEntry +PageList_CreateEntry(BPN bpn) +{ + PageListEntry ple; + CompressedBPN_Write(&ple.cbpn, bpn); + ple.voided = FALSE; + return ple; +} + +static INLINE BPN +PageList_BPN(const PageListEntry *ple) +{ + return CompressedBPN_Read(&ple->cbpn); +} + +static INLINE Bool +PageList_IsVoid(const PageListEntry *ple) +{ + ASSERT(ple->voided == TRUE || ple->voided == FALSE); + return ple->voided; +} + +static INLINE void +PageList_VoidEntry(PageListEntry *ple) +{ + ple->voided = TRUE; +} + + +/* + * This function inspects the set of BPN between entry [0,i) in the page list + * and returns TRUE if any of them matches the provided BPN. + */ +static INLINE Bool +PageList_IsBPNDup(const PageListEntry *pageList, unsigned i, BPN bpn) +{ + unsigned k; + for (k = 0; k < i; k++) { + if (PageList_BPN(&pageList[k]) == bpn) { + return TRUE; + } + } + return FALSE; +} + +#endif diff --git a/vmmon-only/include/pcip_defs.h b/vmmon-only/include/pcip_defs.h new file mode 100644 index 00000000..a00520bb --- /dev/null +++ b/vmmon-only/include/pcip_defs.h @@ -0,0 +1,122 @@ +/********************************************************* + * Copyright (C) 2009-2014 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * pcip_defs.h -- + * + * PCI passthru definitions shared by the vmx, monitor, vmkernel, and + * vmmon. Not all PCI passthru definitions are found here: the shared + * bits mainly pertain to interrupt proxying. 
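+ *
+ * The vector index space below reserves one slot for IOAPIC routing and
+ * one for MSI ahead of the MSI-X block, which is why PCIP_MAX_VECTORS is
+ * PCIP_MAX_MSIX_VECTORS + 2; the index of MSI-X vector n is presumably
+ *
+ *   PCIP_INDEX_MSIXOFF + n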
+ */ + +#ifndef _PCIP_DEFS_H +#define _PCIP_DEFS_H + +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_USERLEVEL +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_VMMON +#include "includeCheck.h" + +#include "monitorAction_exported.h" + +#include "bitvector.h" + +#define MAX_INTERRUPTS 256 // max interrupts a device could use +#define PCIP_MAX_MSIX_VECTORS 128 +#define PCIP_MAX_VECTORS (PCIP_MAX_MSIX_VECTORS + 2) + +typedef struct PCIPVecBV { + BitVector bv; + uint32 reserved[PCIP_MAX_VECTORS / sizeof (uint32) - 1]; +} PCIPVecBV; + +typedef enum PCIPassthruVectorIndex { + PCIP_INDEX_IOAPIC, + PCIP_INDEX_MSI, + PCIP_INDEX_MSIXOFF, + PCIP_INDEX_INVALID = PCIP_INDEX_MSIXOFF + PCIP_MAX_MSIX_VECTORS, +} PCIPassthruVectorIndex; + +typedef enum PCIPassthru_IntrType { + PCIPASSTHRU_INTR_NONE = 0x00, + PCIPASSTHRU_INTR_IOAPIC = 0x01, + PCIPASSTHRU_INTR_MSI = 0x02, + PCIPASSTHRU_INTR_MSIX = 0x04, +} PCIPassthru_IntrType; + +typedef struct FPTIntrProxyInfo { + uint32 adapterIndex; + uint32 vectorIndex; + MonitorIdemAction actionID; + uint32 _pad0; + + /* + * These addresses are only needed for hosted platforms, where our kernel + * modules lack a SharedArea API. + */ +#ifndef VMX86_SERVER + VA64 notifyUVA; + VA64 vectorIndexUVA; +#endif +} FPTIntrProxyInfo; + +typedef struct UPTIntrProxyInfo { + uint32 adapterIndex; + MonitorIdemAction actionID; +} UPTIntrProxyInfo; + +typedef union PCIPassthru_IntrProxyInfo { + FPTIntrProxyInfo fpt; + UPTIntrProxyInfo upt; +} PCIPassthru_IntrProxyInfo; + +typedef enum PCIPassthru_ErrorType { + PCIPASSTHRU_ERROR_NONE = 0x00, + PCIPASSTHRU_ERROR_AER = 0x01, + PCIPASSTHRU_ERROR_PAGE_FAULT = 0x02, +} PCIPassthru_ErrorType; + +typedef struct PCIPassthru_PageFaultInfo { + uint64 ioAddr; + uint64 machAddr; + uint8 faultReason; + uint8 unused[7]; +} PCIPassthru_PageFaultInfo; + +typedef struct PCIPassthru_AERInfo { + uint64 count; +} PCIPassthru_AERInfo; + +typedef union PCIPassthru_ErrorInfo { + PCIPassthru_PageFaultInfo pageFaultInfo; + PCIPassthru_AERInfo aerInfo; +} PCIPassthru_ErrorInfo; + +typedef +#include "vmware_pack_begin.h" +struct PCIPassthru_ErrorMsg { + uint32 sbdf; + PCIPassthru_ErrorType errorType; + PCIPassthru_ErrorInfo errorInfo; +} +#include "vmware_pack_end.h" +PCIPassthru_ErrorMsg; + +#endif // _PCIP_DEFS_H diff --git a/vmmon-only/include/perfctr_generic.h b/vmmon-only/include/perfctr_generic.h new file mode 100644 index 00000000..82a068ba --- /dev/null +++ b/vmmon-only/include/perfctr_generic.h @@ -0,0 +1,72 @@ +/********************************************************* + * Copyright (C) 1998-2012,2014 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. 
+ * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * perfctr_generic.h -- + * + */ + +#ifndef _PERFCTR_GENERIC_H_ +#define _PERFCTR_GENERIC_H_ + +#define INCLUDE_ALLOW_USERLEVEL + +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_VMMON + +#include "includeCheck.h" +#include "vm_basic_types.h" + +/* + * nmiNo -- vmm peer is not attempting to do nmi profiling this run + * nmiYes -- vmm peer is doing nmi profiling and nmis are currently enabled + * nmiStopped -- vmm peer is doing nmi profiling, but nmis are temporarily + * disabled for safety reasons. + */ +typedef enum {nmiNo = 0, nmiYes, nmiStopped} NMIStatus; +typedef struct NMIShared { /* shared with vmx and vmkernel */ + NMIStatus vmmStatus; + int32 nmiErrorCode; + int64 nmiErrorData; +} NMIShared; + +/* + * CrossProf: structures for unified profiling of vmm, vmx, and + * vmkernel. Per-vcpu. + */ + +#define CALLSTACK_CROSSPROF_PAGES 1 + +typedef struct { + /* + * This structure is per-vcpu. The raw data is a packed vector + * of MonitorCallStackSample, a variable-length structure. + */ + + /* raw data - packed vec of MonitorCallStackSample, variable length */ + uint8 crossProfSampleBuffer[PAGES_2_BYTES(CALLSTACK_CROSSPROF_PAGES)]; + + uint32 crossProfSampleBytes; + uint32 crossProfNumDroppedSamples; /* For when buffer fills up */ + Bool enabled; /* Can be false in stats build if monitor.callstack=FALSE */ + uint8 _pad[3]; +} CrossProfShared; + +#endif // ifndef _PERFCTR_GENERIC_H_ diff --git a/vmmon-only/include/pgtbl.h b/vmmon-only/include/pgtbl.h new file mode 100644 index 00000000..39ef4e19 --- /dev/null +++ b/vmmon-only/include/pgtbl.h @@ -0,0 +1,382 @@ +/********************************************************* + * Copyright (C) 2002,2014 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef __PGTBL_H__ +# define __PGTBL_H__ + + +#include + +#include "compat_pgtable.h" +#include "compat_spinlock.h" +#include "compat_page.h" + +/* + *----------------------------------------------------------------------------- + * + * PgtblPte2MPN -- + * + * Returns the page structure associated to a Page Table Entry. 
+ * + * This function is not allowed to schedule() because it can be called while + * holding a spinlock --hpreg + * + * Results: + * INVALID_MPN on failure + * mpn on success + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE MPN +PgtblPte2MPN(pte_t *pte) // IN +{ + MPN mpn; + if (pte_present(*pte) == 0) { + return INVALID_MPN; + } + mpn = pte_pfn(*pte); + if (mpn >= INVALID_MPN) { + return INVALID_MPN; + } + return mpn; +} + + +/* + *----------------------------------------------------------------------------- + * + * PgtblPte2Page -- + * + * Returns the page structure associated to a Page Table Entry. + * + * This function is not allowed to schedule() because it can be called while + * holding a spinlock --hpreg + * + * Results: + * The page structure if the page table entry points to a physical page + * NULL if the page table entry does not point to a physical page + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE struct page * +PgtblPte2Page(pte_t *pte) // IN +{ + if (pte_present(*pte) == 0) { + return NULL; + } + + return compat_pte_page(*pte); +} + + +/* + *----------------------------------------------------------------------------- + * + * PgtblPGD2PTELocked -- + * + * Walks through the hardware page tables to try to find the pte + * associated to a virtual address. + * + * Results: + * pte. Caller must call pte_unmap if valid pte returned. + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE pte_t * +PgtblPGD2PTELocked(compat_pgd_t *pgd, // IN: PGD to start with + VA addr) // IN: Address in the virtual address + // space of that process +{ + compat_pud_t *pud; + pmd_t *pmd; + pte_t *pte; + + if (compat_pgd_present(*pgd) == 0) { + return NULL; + } + + pud = compat_pud_offset(pgd, addr); + if (compat_pud_present(*pud) == 0) { + return NULL; + } + + pmd = pmd_offset_map(pud, addr); + if (pmd_present(*pmd) == 0) { + pmd_unmap(pmd); + return NULL; + } + + pte = pte_offset_map(pmd, addr); + pmd_unmap(pmd); + return pte; +} + + +/* + *----------------------------------------------------------------------------- + * + * PgtblVa2PTELocked -- + * + * Walks through the hardware page tables to try to find the pte + * associated to a virtual address. + * + * Results: + * pte. Caller must call pte_unmap if valid pte returned. + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE pte_t * +PgtblVa2PTELocked(struct mm_struct *mm, // IN: Mm structure of a process + VA addr) // IN: Address in the virtual address + // space of that process +{ + return PgtblPGD2PTELocked(compat_pgd_offset(mm, addr), addr); +} + + +/* + *----------------------------------------------------------------------------- + * + * PgtblVa2MPNLocked -- + * + * Retrieve MPN for a given va. + * + * Caller must call pte_unmap if valid pte returned. 
The mm->page_table_lock + * must be held, so this function is not allowed to schedule() --hpreg + * + * Results: + * INVALID_MPN on failure + * mpn on success + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE MPN +PgtblVa2MPNLocked(struct mm_struct *mm, // IN: Mm structure of a process + VA addr) // IN: Address in the virtual address +{ + pte_t *pte; + + pte = PgtblVa2PTELocked(mm, addr); + if (pte != NULL) { + MPN mpn = PgtblPte2MPN(pte); + pte_unmap(pte); + return mpn; + } + return INVALID_MPN; +} + + +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 0) +/* + *----------------------------------------------------------------------------- + * + * PgtblKVa2MPNLocked -- + * + * Retrieve MPN for a given kernel va. + * + * Caller must call pte_unmap if valid pte returned. The mm->page_table_lock + * must be held, so this function is not allowed to schedule() --hpreg + * + * Results: + * INVALID_MPN on failure + * mpn on success + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE MPN +PgtblKVa2MPNLocked(struct mm_struct *mm, // IN: Mm structure of a caller + VA addr) // IN: Address in the virtual address +{ + pte_t *pte; + + pte = PgtblPGD2PTELocked(compat_pgd_offset_k(mm, addr), addr); + if (pte != NULL) { + MPN mpn = PgtblPte2MPN(pte); + pte_unmap(pte); + return mpn; + } + return INVALID_MPN; +} +#endif + + +/* + *----------------------------------------------------------------------------- + * + * PgtblVa2PageLocked -- + * + * Return the "page" struct for a given va. + * + * Results: + * struct page or NULL. The mm->page_table_lock must be held, so this + * function is not allowed to schedule() --hpreg + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE struct page * +PgtblVa2PageLocked(struct mm_struct *mm, // IN: Mm structure of a process + VA addr) // IN: Address in the virtual address +{ + pte_t *pte; + + pte = PgtblVa2PTELocked(mm, addr); + if (pte != NULL) { + struct page *page = PgtblPte2Page(pte); + pte_unmap(pte); + return page; + } else { + return NULL; + } +} + + +/* + *----------------------------------------------------------------------------- + * + * PgtblVa2MPN -- + * + * Walks through the hardware page tables of the current process to try to + * find the page structure associated to a virtual address. + * + * Results: + * Same as PgtblVa2MPNLocked() + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE MPN +PgtblVa2MPN(VA addr) // IN +{ + struct mm_struct *mm; + MPN mpn; + + /* current->mm is NULL for kernel threads, so use active_mm. */ + mm = current->active_mm; + if (compat_get_page_table_lock(mm)) { + spin_lock(compat_get_page_table_lock(mm)); + } + mpn = PgtblVa2MPNLocked(mm, addr); + if (compat_get_page_table_lock(mm)) { + spin_unlock(compat_get_page_table_lock(mm)); + } + return mpn; +} + + +#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 0) +/* + *----------------------------------------------------------------------------- + * + * PgtblKVa2MPN -- + * + * Walks through the hardware page tables of the current process to try to + * find the page structure associated to a virtual address. 
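PgtblVa2MPN(), defined above, takes mm->page_table_lock when the kernel provides one and then performs the locked walk. A minimal usage sketch; the wrapper name and its error handling are illustrative only:

static MPN
ExampleUserVaToMPN(VA uva)
{
   MPN mpn = PgtblVa2MPN(uva);   /* walks current->active_mm under the lock */

   if (mpn == INVALID_MPN) {
      /* Page not present; a real caller would fault it in and retry. */
      return INVALID_MPN;
   }
   return mpn;
}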
+ * + * Results: + * Same as PgtblVa2MPNLocked() + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE MPN +PgtblKVa2MPN(VA addr) // IN +{ + struct mm_struct *mm = current->active_mm; + MPN mpn; + + if (compat_get_page_table_lock(mm)) { + spin_lock(compat_get_page_table_lock(mm)); + } + mpn = PgtblKVa2MPNLocked(mm, addr); + if (compat_get_page_table_lock(mm)) { + spin_unlock(compat_get_page_table_lock(mm)); + } + return mpn; +} +#endif + + +/* + *----------------------------------------------------------------------------- + * + * PgtblVa2Page -- + * + * Walks through the hardware page tables of the current process to try to + * find the page structure associated to a virtual address. + * + * Results: + * Same as PgtblVa2PageLocked() + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE struct page * +PgtblVa2Page(VA addr) // IN +{ + struct mm_struct *mm = current->active_mm; + struct page *page; + + if (compat_get_page_table_lock(mm)) { + spin_lock(compat_get_page_table_lock(mm)); + } + page = PgtblVa2PageLocked(mm, addr); + if (compat_get_page_table_lock(mm)) { + spin_unlock(compat_get_page_table_lock(mm)); + } + return page; +} + + +#endif /* __PGTBL_H__ */ diff --git a/vmmon-only/include/pshare_ext.h b/vmmon-only/include/pshare_ext.h new file mode 100644 index 00000000..ab42c3d1 --- /dev/null +++ b/vmmon-only/include/pshare_ext.h @@ -0,0 +1,64 @@ +/********************************************************* + * Copyright (C) 2001,2014 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * pshare_ext.h -- + * + * VMKernel/VMMon <-> VMM transparent page sharing info. 
+ */ + +#ifndef _PSHARE_EXT_H +#define _PSHARE_EXT_H + +#define INCLUDE_ALLOW_USERLEVEL + +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_MODULE +#include "includeCheck.h" + +#include "pagelist.h" +#include "vm_basic_types.h" +#include "vm_assert.h" + +/* + * constants + */ + +#define PSHARE_PAGELIST_MAX (PAGELIST_MAX) +#define PSHARE_P2M_BUFFER_MPNS_MAX (16) +#define PSHARE_P2M_BUFFER_MPNS_DEFAULT (4) +#define PSHARE_P2M_BUFFER_SLOTS_PER_MPN (PAGE_SIZE / sizeof(PShare_P2MUpdate)) + +#define PSHARE_POISON_MARKER (CONST64U(0xAAAAAAAAAAAAAAAA)) + +#define PSHARE_SALT_UNSET 0 +#define PSHARE_SALT_DEFAULT 1 + +MY_ASSERTS(PSHARE_EXT, + ASSERT_ON_COMPILE(PSHARE_PAGELIST_MAX <= PAGELIST_MAX);) + +/* + * types + */ + +typedef struct PShare_P2MUpdate { + BPN bpn; + MPN mpn; +} PShare_P2MUpdate; +#endif diff --git a/vmmon-only/include/ptsc.h b/vmmon-only/include/ptsc.h new file mode 100644 index 00000000..dfa0328a --- /dev/null +++ b/vmmon-only/include/ptsc.h @@ -0,0 +1,263 @@ +/********************************************************* + * Copyright (C) 1998-2014 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * ptsc.h -- + * + * Pseudo TSC + */ + +#ifndef _PTSC_H_ +#define _PTSC_H_ + +#define INCLUDE_ALLOW_VMX + +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMKERNEL +#include "includeCheck.h" + +#include "rateconv.h" + +/* + * RDTSC and PTSC_Get. + * + * RDTSC reads the hardware timestamp counter on the current physical + * CPU. In general, the TSC is *not* a globally consistent timer that + * runs at a constant rate. Any code that still assumes it is should + * be corrected; see PR 20499. + * + * PTSC_Get returns a pseudo-TSC that runs at approximately the + * maximum speed of physical CPU 0's TSC and is approximately globally + * consistent. It is available both at userlevel and in the monitor, + * with different implementations. In the vmkernel, Timer_PseudoTSC + * provides similar functionality. + * + */ + +/* TS stands for "timestamp", which is in units of "cycles" */ +typedef uint64 VmAbsoluteTS; // a particular point in time (in cycles) +typedef int64 VmRelativeTS; // a signed delta in cycles +typedef uint64 VmIntervalTS; // an unsigned delta in cycles +typedef uint64 VmAbsoluteUS; // a particular point in time (in us) +typedef int64 VmRelativeUS; // a signed delta in us +typedef uint64 VmIntervalUS; // an unsigned delta in us + +/* + * Compare two VmAbsoluteTS's using comparison operator op, allowing + * for wrap. The assumption is that differences should not be more + * than 2**63, so a larger difference is taken as negative. 
+ */ +#define COMPARE_TS(ts1, op, ts2) (((int64) ((ts1) - (ts2))) op 0) + +#define MAX_ABSOLUTE_TS \ + ((VmAbsoluteTS) CONST64U(0xffffffffffffffff)) + +/* + * Largest possible unambiguous difference between two VmAbsoluteTS's + * according to COMPARE_TS's method of comparison. + */ +#define MAX_RELATIVE_TS \ + ((VmRelativeTS) CONST64(0x7fffffffffffffff)) + +#define MAX_ABSOLUTE_US \ + ((VmAbsoluteUS) CONST64U(0xffffffffffffffff)) + +typedef struct PTSCInfo { + Bool hwTSCsSynced; + Bool hwTSCsAdjusted; + uint8 _pad[6]; + int64 hz; + uint32 kHz; + uint32 mHz; + + RateConv_Ratio usToCycles; + RateConv_Ratio cyclesToUs; + RateConv_Ratio msToCycles; + RateConv_Ratio cyclesToNs; +} PTSCInfo; + +extern PTSCInfo ptscInfo; + +Bool PTSC_Init(uint64 tscHz); +VmAbsoluteTS PTSC_InitialCount(const char *module, + const char *option, + VmIntervalTS freq, + VmAbsoluteTS defaultCnt); +Bool PTSC_HasPerfectlySynchronizedTSCs(void); + +static INLINE int64 +PTSC_Hz(void) +{ + ASSERT(ptscInfo.hz); + return ptscInfo.hz; +} + +static INLINE uint32 +PTSC_KHz(void) +{ + ASSERT(ptscInfo.kHz); + return ptscInfo.kHz; +} + +static INLINE uint32 +PTSC_MHz(void) +{ + ASSERT(ptscInfo.mHz); + return ptscInfo.mHz; +} + +#if defined(VM_X86_64) || defined(VM_ARM_64) + +/* + * Conversions to/from cycles. Note that the conversions operate on + * signed values, so be careful when taking the difference of two + * VmAbsoluteTS (which is unsigned) that that value is not out of range + * of the signed type. + */ + +static INLINE VmRelativeTS +PTSC_USToCycles(int64 us) +{ + return Muls64x32s64(us, ptscInfo.usToCycles.mult, ptscInfo.usToCycles.shift); +} + +static INLINE VmRelativeTS +PTSC_MSToCycles(int64 ms) +{ + return Muls64x32s64(ms, ptscInfo.msToCycles.mult, ptscInfo.msToCycles.shift); +} + +static INLINE int64 +PTSC_CyclesToNS(VmRelativeTS ts) +{ + return Muls64x32s64(ts, ptscInfo.cyclesToNs.mult, ptscInfo.cyclesToNs.shift); +} + +static INLINE int64 +PTSC_CyclesToUS(VmRelativeTS ts) +{ + return Muls64x32s64(ts, ptscInfo.cyclesToUs.mult, ptscInfo.cyclesToUs.shift); +} + +#else + +/* 32-bit Muls64x32s64 too big to justify inlining. */ +VmRelativeTS PTSC_USToCycles(int64 us); +VmRelativeTS PTSC_MSToCycles(int64 ms); +int64 PTSC_CyclesToNS(VmRelativeTS ts); +int64 PTSC_CyclesToUS(VmRelativeTS ts); + +#endif + +#if defined(VMX86_SERVER) && defined(VMX86_VMX) + +/* + * ESX with userworld VMX + */ +#include "x86types.h" +#include "user_layout.h" + +#ifdef VM_ARM_64 +static INLINE VmAbsoluteTS +PTSC_Get(void) +{ + extern __thread User_ThreadData vmkUserTdata; + + register RateConv_Params params; + register uint64 pseudoTSC; + + /* + * On ARM64 the generic timer guarantees that the counters are synchronous + * and independent of CPU frequency. + */ + params = vmkUserTdata.pseudoTSCConv; + pseudoTSC = RDTSC(); + + /* + * assert that conversion rate is `identity'. 
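COMPARE_TS() above compares timestamps through a signed 64-bit difference, so the result stays correct across counter wrap as long as the two values are within 2**63 cycles of each other. A small sketch combining it with PTSC_USToCycles(); both helper names are invented:

static INLINE VmAbsoluteTS
ExampleDeadlineInUS(VmAbsoluteTS now, int64 us)
{
   return now + PTSC_USToCycles(us);        /* microseconds -> cycles */
}

static INLINE Bool
ExampleDeadlineReached(VmAbsoluteTS now, VmAbsoluteTS deadline)
{
   return COMPARE_TS(now, >=, deadline);    /* (int64)(now - deadline) >= 0 */
}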
+ * we'll have to revisit that when/if this assumption changes + * on some platform + */ + ASSERT((params.mult == 1 && params.shift == 0) || + (params.mult == 0x80000000 && params.shift == 31)); + + pseudoTSC += params.add; + + return pseudoTSC; +} +#else +static INLINE VmAbsoluteTS +PTSC_Get(void) +{ + extern __thread User_ThreadData vmkUserTdata; + VmAbsoluteTS ptsc; + + if (vmkUserTdata.magic != USER_THREADDATA_MAGIC) { + return 0; + } + ptsc = vmkUserTdata.u.pseudoTSCGet(&vmkUserTdata); + ASSERT((int64)ptsc >= 0); + return ptsc; +} +#endif +#else + +/* + * Monitor and hosted VMX + */ + +VmAbsoluteTS PTSC_Get(void); + +#endif + +/* + *----------------------------------------------------------------------------- + * + * PTSC_HasSynchronizedTSCs -- + * + * Returns TRUE iff the platform TSCs are known to be synchronized. + * + *----------------------------------------------------------------------------- + */ + +static INLINE Bool +PTSC_HasSynchronizedTSCs(void) +{ + return ptscInfo.hwTSCsSynced; +} + + +/* + *----------------------------------------------------------------------------- + * + * PTSC_HostAdjustedTSCs -- + * + * Returns TRUE if the platform may have adjusted TSCs in an attempt + * to sync them up. + * + *----------------------------------------------------------------------------- + */ + +static INLINE Bool +PTSC_HostAdjustedTSCs(void) +{ + return ptscInfo.hwTSCsAdjusted; +} + +#endif /* ifndef _PTSC_H_ */ diff --git a/vmmon-only/include/rateconv.h b/vmmon-only/include/rateconv.h new file mode 100644 index 00000000..14f0195f --- /dev/null +++ b/vmmon-only/include/rateconv.h @@ -0,0 +1,118 @@ +/********************************************************* + * Copyright (C) 2003 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * + * rateconv.h -- + * + * Parameters and functions for linear rate conversion of 64 bit + * counters: + * + * y = ((x * mult) >> shift) + add. + * + */ + +#ifndef _VM_RATECONV_H_ +#define _VM_RATECONV_H_ + +#define INCLUDE_ALLOW_USERLEVEL + +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_VMK_MODULE +#define INCLUDE_ALLOW_DISTRIBUTE +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_VMMON +#include "includeCheck.h" + +#include "vm_basic_types.h" +#include "vm_basic_asm.h" +#include "vm_assert.h" +#include "vm_atomic.h" + +/* RateConv_Params is part of vmx<->vmmon interface (INIT_PSEUDO_TSC ioctl) */ +typedef struct RateConv_Params { + uint32 mult; /* mult == 1 implies shift == 0. */ + uint32 shift; + int64 add; +} RateConv_Params; + +typedef struct RateConv_ParamsVolatile { + RateConv_Params p; + Bool changed; + uint8 pad[7]; +} RateConv_ParamsVolatile; + +typedef struct RateConv_Ratio { + uint32 mult; + uint32 shift; +} RateConv_Ratio; + +#define RATE_CONV_IDENTITY { 1, 0, 0 } /* Out = in. 
*/ + +Bool RateConv_ComputeParams(uint64 inHz, uint64 inBase, + uint64 outHz, uint64 outBase, + RateConv_Params *conv); +void RateConv_LogParams(const char *prefix, + uint64 inHz, uint64 inBase, + uint64 outHz, uint64 outBase, + const RateConv_Params *conv); +Bool RateConv_ComputeRatio(uint64 inHz, uint64 outHz, + RateConv_Ratio *ratio); +void RateConv_LogRatio(const char *prefix, + uint64 inHz, uint64 outHz, + const RateConv_Ratio *ratio); + + +/* + *---------------------------------------------------------------------- + * + * RateConv_Unsigned -- + * + * Apply rate conversion to an unsigned argument: + * y = ((x * mult) >> shift) + add. + * + *---------------------------------------------------------------------- + */ + +static INLINE uint64 +RateConv_Unsigned(const RateConv_Params *conv, uint64 x) +{ + return Mul64x3264(x, conv->mult, conv->shift) + conv->add; +} + + +/* + *---------------------------------------------------------------------- + * + * RateConv_Signed -- + * + * Apply rate conversion to a signed argument: + * y = ((x * mult) >> shift) + add. + * + *---------------------------------------------------------------------- + */ + +static INLINE int64 +RateConv_Signed(const RateConv_Params *conv, int64 x) +{ + return Muls64x32s64(x, conv->mult, conv->shift) + conv->add; +} + + +#endif // _VM_RATECONV_H_ diff --git a/vmmon-only/include/uccostTable.h b/vmmon-only/include/uccostTable.h new file mode 100644 index 00000000..87366788 --- /dev/null +++ b/vmmon-only/include/uccostTable.h @@ -0,0 +1,34 @@ +/********************************************************* + * Copyright (C) 1998-2014 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_VMMON +#include "includeCheck.h" + +UC(CALL_START) +UC(BEGIN_BACK_TO_HOST) +UC(SWITCHED_TO_MODULE) +UC(VMX_SELECT_RETURN) +UC(VMX_HANDLER_START) +UC(VMX_SIGNAL) +UC(MODULE_SIGNAL) +UC(SWITCHING_TO_MONITOR) +UC(DONE_BACK_TO_HOST) +UC(CALL_END) + +#undef UC diff --git a/vmmon-only/include/usercalldefs.h b/vmmon-only/include/usercalldefs.h new file mode 100644 index 00000000..9b32ee79 --- /dev/null +++ b/vmmon-only/include/usercalldefs.h @@ -0,0 +1,35 @@ +/********************************************************* + * Copyright (C) 2008 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. 
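uccostTable.h above is an X-macro table: it expands whatever UC() the includer defines, once per checkpoint, and then undefines UC. A hedged sketch of the usual consumption pattern; the enum and name prefix below are assumptions, not taken from this patch:

#define UC(x) UCCOST_ ## x,
typedef enum UCCostStampName {
#include "uccostTable.h"
   UCCOST_MAX
} UCCostStampName;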
+ * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +#ifndef USERCALLDEFS_H +#define USERCALLDEFS_H + +#ifdef linux +#include +#define USERCALL_RESTART (-ERESTARTNOINTR) +#else +#include +#define USERCALL_RESTART (USERCALL_NOP) +#endif +/* + * -1 to -4096 are reserved for syscall errors on Linux. -1 is reserved for + * failing DeviceIoControl on Windows. + */ +#define USERCALL_VMX86ALLOCERR (-8192) + +#endif diff --git a/vmmon-only/include/vcpuid.h b/vmmon-only/include/vcpuid.h new file mode 100644 index 00000000..c12dcef0 --- /dev/null +++ b/vmmon-only/include/vcpuid.h @@ -0,0 +1,65 @@ +/********************************************************* + * Copyright (C) 1998-2014 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * + * vcpuid.h -- + * + * Monitor's VCPU ID. + */ + +#ifndef _VCPUID_H_ +#define _VCPUID_H_ + +#define INCLUDE_ALLOW_USERLEVEL + +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_VMK_MODULE +#define INCLUDE_ALLOW_DISTRIBUTE +#define INCLUDE_ALLOW_VMCORE +#include "includeCheck.h" + +#include "vm_basic_types.h" + + +typedef uint32 Vcpuid; // VCPU number + +#define VCPUID_INVALID (~0U) + +#define BOOT_VCPU_ID 0 +#define IS_BOOT_VCPUID(vcpuid) ((vcpuid) == BOOT_VCPU_ID) + +#define MAX_VCPUS 128 + +#define MAX_CORES_PER_SOCKET 64 + +#ifdef VMM +#include "vcpuset.h" + +/* In VMM, CurVcpuid() is available everywhere. */ +extern const Vcpuid curVcpuid; +extern const VCPUSet curVcpuidSet; +#define CurVcpuid() (curVcpuid) +#define CurVcpuidSet() (&curVcpuidSet) +#define IS_BOOT_VCPU() IS_BOOT_VCPUID(CurVcpuid()) + +#endif /* VMM */ + +#endif // ifndef _VCPUID_H_ diff --git a/vmmon-only/include/vcpuset.h b/vmmon-only/include/vcpuset.h new file mode 100644 index 00000000..4bbe3a08 --- /dev/null +++ b/vmmon-only/include/vcpuset.h @@ -0,0 +1,808 @@ +/********************************************************* + * Copyright (C) 2002-2014 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. 
+ * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * vcpuset.h -- + * + * ADT for a set of VCPUs. Implemented as an array of bitmasks. + * + */ + +#ifndef _VCPUSET_H_ +#define _VCPUSET_H_ + + +#define INCLUDE_ALLOW_VMX +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_USERLEVEL +#define INCLUDE_ALLOW_VMCORE +#include "includeCheck.h" + +#include "vm_basic_asm.h" +#include "vm_atomic.h" +#include "vcpuid.h" +#include "vcpuset_types.h" + +#if defined VMX86_VMX +# include "str.h" /* Str_Snprintf */ +# define VCS_SNPRINTF Str_Snprintf +#elif defined MONITOR_APP +# include /* libc snprintf */ +# if defined WIN32 +# define VCS_SNPRINTF _snprintf +# else +# define VCS_SNPRINTF snprintf +# endif +#elif defined VMM || defined VMKERNEL +# include "vm_libc.h" /* vmcore snprintf */ +# define VCS_SNPRINTF snprintf +#endif + +#ifdef VMX86_VMX +#include "vmx.h" +#endif + + +/* + * A buffer for logging a VCPUSet must fit a maximally-populated set. To + * balance brevity and readability, sets are formatted for printing like long + * hexadecimal numbers, with a '.' at every 64-VCPU subset boundary. The + * highest-numbered VCPU in the set is printed first, followed by all slots + * for lower-numbered VCPUs, populated or not. Leading zeroes are not printed. + * + * Examples, assuming a VCS_SUBSET_COUNT of 2: + * An empty set: "0x0\0" + * A full set: "0xffffffffffffffff.ffffffffffffffff\0" + * A set with only VCPU 50: "0x4000000000000\0" + * A set with only VCPU 80: "0x10000.0000000000000000\0" + */ +#define VCS_BUF_SIZE (2 + /* "0x" */ \ + (VCS_SUBSET_COUNT * VCS_SUBSET_WIDTH / 4) + /* (hex) */ \ + (VCS_SUBSET_COUNT - 1) + /* '.' */ \ + 1) /* NULL */ + +extern VCPUSet vcpuSetFull; + +#define FOR_EACH_VCPU_IN_SET(_vcpuSet, _v) \ + do { \ + Vcpuid _v; \ + VCPUSet __vcs; \ + VCPUSet_Copy(&__vcs, _vcpuSet); \ + while ((_v = VCPUSet_FindFirst(&__vcs)) != VCPUID_INVALID) { \ + VCPUSet_Remove(&__vcs, _v); + +#define ROF_EACH_VCPU_IN_SET() \ + } \ + } while (0) + + +#define FOR_EACH_SUBSET_IN_SET(_setIndex) \ + do { \ + int _setIndex; \ + for (_setIndex = 0; _setIndex < VCS_SUBSET_COUNT; _setIndex++) { + +#define ROF_EACH_SUBSET_IN_SET() \ + } \ + } while (0) + + +#define FOR_EACH_SUBSET_IN_SET_COUNTDOWN(_setIndex) \ + do { \ + int _setIndex; \ + for (_setIndex = VCS_SUBSET_COUNT - 1; _setIndex >= 0; _setIndex--) { + +#define ROF_EACH_SUBSET_IN_SET_COUNTDOWN() \ + } \ + } while (0) + + +#define FOR_EACH_POPULATED_SUBSET_IN_SET(_setIndex) \ + do { \ + int _setIndex; \ + int _maxSubsets = VCS_VCPUID_SUBSET_IDX(NumVCPUs() - 1); \ + for (_setIndex = 0; _setIndex <= _maxSubsets; _setIndex++) { + +#define ROF_EACH_POPULATED_SUBSET_IN_SET() \ + } \ + } while (0) + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_Empty -- + * + * Clear all bits in a VCPUSet. + * + *---------------------------------------------------------------------- + */ + +static INLINE void +VCPUSet_Empty(VCPUSet *vcs) +{ + FOR_EACH_SUBSET_IN_SET(idx) { + vcs->subset[idx] = 0; + } ROF_EACH_SUBSET_IN_SET(); +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_IsEmpty -- + * + * Return TRUE iff a VCPUSet has no bits set. 
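The FOR_EACH_VCPU_IN_SET / ROF_EACH_VCPU_IN_SET pair above iterates over a private copy of the set, removing each member as it is visited, so the original set is untouched. A minimal usage sketch; the function name is invented:

static INLINE int
ExampleCountMembers(const VCPUSet *vcs)
{
   int n = 0;

   FOR_EACH_VCPU_IN_SET(vcs, v) {
      n++;                          /* 'v' is the Vcpuid of the current member */
   } ROF_EACH_VCPU_IN_SET();
   return n;
}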
+ * + *---------------------------------------------------------------------- + */ + +static INLINE Bool +VCPUSet_IsEmpty(const VCPUSet *vcs) +{ + FOR_EACH_SUBSET_IN_SET(idx) { + if (vcs->subset[idx] != 0) { + return FALSE; + } + } ROF_EACH_SUBSET_IN_SET(); + return TRUE; +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_Full -- + * + * Returns a pointer to a VCPUSet containing all valid VCPUs. + * + *---------------------------------------------------------------------- + */ +static INLINE const VCPUSet * +VCPUSet_Full(void) +{ + /* + * Read too early, we may get the wrong notion of how many + * vcpus the VM has. Cf. pr286243 and pr289186. + */ +#if defined (VMX86_VMX) + ASSERT(NumVCPUs() != 0 && !VCPUSet_IsEmpty(&vcpuSetFull)); +#endif + return &vcpuSetFull; +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_Copy -- + * + * Copy one VCPUSet's contents to another. + * + *---------------------------------------------------------------------- + */ + +static INLINE void +VCPUSet_Copy(VCPUSet *dest, const VCPUSet *src) +{ + FOR_EACH_SUBSET_IN_SET(idx) { + dest->subset[idx] = src->subset[idx]; + } ROF_EACH_SUBSET_IN_SET(); +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_Equals -- + * + * Compare two VCPUSets, return TRUE iff their contents match. + * + *---------------------------------------------------------------------- + */ + +static INLINE Bool +VCPUSet_Equals(const VCPUSet *vcs1, const VCPUSet *vcs2) +{ + FOR_EACH_SUBSET_IN_SET(idx) { + if (vcs1->subset[idx] != vcs2->subset[idx]) { + return FALSE; + } + } ROF_EACH_SUBSET_IN_SET(); + return TRUE; +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_IsMember -- + * + * Return TRUE iff the given Vcpuid is present in a VCPUSet. + * + *---------------------------------------------------------------------- + */ + +static INLINE Bool +VCPUSet_IsMember(const VCPUSet *vcs, Vcpuid v) +{ + ASSERT(v < MAX_VCPUS); + return (vcs->subset[VCS_VCPUID_SUBSET_IDX(v)] & + VCS_VCPUID_SUBSET_BIT(v)) != 0; +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_AtomicIsMember -- + * + * Return TRUE iff the given Vcpuid is present in a VCPUSet. + * + *---------------------------------------------------------------------- + */ + +static INLINE Bool +VCPUSet_AtomicIsMember(VCPUSet *vcs, Vcpuid v) +{ + volatile uint64 *subset = &vcs->subset[VCS_VCPUID_SUBSET_IDX(v)]; + ASSERT(v < MAX_VCPUS); + return (Atomic_Read64(Atomic_VolatileToAtomic64(subset)) & + VCS_VCPUID_SUBSET_BIT(v)) != 0; +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_FindFirst -- + * VCPUSet_FindLast -- + * + * Find the first (lowest-numbered) or last (highest-numbered) + * Vcpuid in a VCPUSet. + * + * Results: + * Vcpuid if at least one is present in a set. + * VCPUID_INVALID if the set is empty. 
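VCPUSet_IsMember() above selects subset[v >> 6] and tests bit (v & 63); with VCS_SUBSET_COUNT == 2 this covers VCPUs 0-127. As a worked example, VCPU 80 maps to subset[1], bit 16, matching the "0x10000.0000000000000000" case in the log-format comment earlier. The same test written out by hand, with an invented function name:

static INLINE Bool
ExampleVcpu80IsMember(const VCPUSet *vcs)
{
   return (vcs->subset[VCS_VCPUID_SUBSET_IDX(80)] &   /* subset[1] */
           VCS_VCPUID_SUBSET_BIT(80)) != 0;           /* bit 16    */
}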
+ * + *---------------------------------------------------------------------- + */ + +static INLINE Vcpuid +VCPUSet_FindFirst(const VCPUSet *vcs) +{ + FOR_EACH_SUBSET_IN_SET(idx) { + uint64 subset = vcs->subset[idx]; + if (subset != 0) { + return lssb64_0(subset) + (idx << VCS_SUBSET_SHIFT); + } + } ROF_EACH_SUBSET_IN_SET(); + return VCPUID_INVALID; +} + +static INLINE Vcpuid +VCPUSet_FindLast(const VCPUSet *vcs) +{ + FOR_EACH_SUBSET_IN_SET_COUNTDOWN(idx) { + uint64 subset = vcs->subset[idx]; + if (subset != 0) { + return mssb64_0(subset) + (idx << VCS_SUBSET_SHIFT); + } + } ROF_EACH_SUBSET_IN_SET_COUNTDOWN(); + return VCPUID_INVALID; +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_Remove -- + * VCPUSet_AtomicRemove -- + * + * Remove or atomically remove a single Vcpuid from a VCPUSet. + * + *---------------------------------------------------------------------- + */ + +static INLINE void +VCPUSet_Remove(VCPUSet *vcs, Vcpuid v) +{ + ASSERT(v < MAX_VCPUS); + vcs->subset[VCS_VCPUID_SUBSET_IDX(v)] &= ~VCS_VCPUID_SUBSET_BIT(v); +} + + +static INLINE void +VCPUSet_AtomicRemove(VCPUSet *vcs, Vcpuid v) +{ + volatile uint64 *subset = &vcs->subset[VCS_VCPUID_SUBSET_IDX(v)]; + ASSERT(v < MAX_VCPUS); + Atomic_And64(Atomic_VolatileToAtomic64(subset), ~VCS_VCPUID_SUBSET_BIT(v)); +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_IncludeSet -- + * VCPUSet_RemoveSet -- + * + * Add/remove all vcpus present in the set 'src' to/from the set 'dest'. + * + *---------------------------------------------------------------------- + */ + +static INLINE void +VCPUSet_IncludeSet(VCPUSet *dest, const VCPUSet *src) +{ + FOR_EACH_SUBSET_IN_SET(idx) { + dest->subset[idx] |= src->subset[idx]; + } ROF_EACH_SUBSET_IN_SET(); +} + + +static INLINE void +VCPUSet_RemoveSet(VCPUSet *dest, const VCPUSet *src) +{ + FOR_EACH_SUBSET_IN_SET(idx) { + dest->subset[idx] &= ~src->subset[idx]; + } ROF_EACH_SUBSET_IN_SET(); +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_Include -- + * VCPUSet_AtomicInclude -- + * + * Add or atomically add a single Vcpuid to a VCPUSet. + * + *---------------------------------------------------------------------- + */ + +static INLINE void +VCPUSet_Include(VCPUSet *vcs, Vcpuid v) +{ + ASSERT(v < MAX_VCPUS); + vcs->subset[VCS_VCPUID_SUBSET_IDX(v)] |= VCS_VCPUID_SUBSET_BIT(v); +} + + +static INLINE void +VCPUSet_AtomicInclude(VCPUSet *vcs, Vcpuid v) +{ + volatile uint64 *subset = &vcs->subset[VCS_VCPUID_SUBSET_IDX(v)]; + ASSERT(v < MAX_VCPUS); + Atomic_Or64(Atomic_VolatileToAtomic64(subset), VCS_VCPUID_SUBSET_BIT(v)); +} + + +#if defined(VMM) && !defined(MONITOR_APP) +/* + *---------------------------------------------------------------------- + * + * VCPUSet_PackCareful -- + * + * Pack a VCPUSet into the bytes at "ptr". + * + *---------------------------------------------------------------------- + */ + +static INLINE void +VCPUSet_PackCareful(unsigned numVCPUs, const VCPUSet *vcs, void *ptr) +{ + memcpy(ptr, vcs->subset, (numVCPUs + 7) / 8); +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_UnpackCareful -- + * + * Unpack a VCPUSet from the bytes at "src". 
+ * + *---------------------------------------------------------------------- + */ + +static INLINE void +VCPUSet_UnpackCareful(unsigned numVCPUs, VCPUSet *vcs, void *ptr) +{ + memcpy(vcs->subset, ptr, (numVCPUs + 7) / 8); +} +#endif /* VMM && !MONITOR_APP */ + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_PopulateRange -- + * + * Populates the given set with 'numVCPUs' VCPUs starting at 'firstVCPU'. + * + *---------------------------------------------------------------------- + */ + +static INLINE void +VCPUSet_PopulateRange(VCPUSet *vcs, unsigned firstVCPU, + unsigned numVCPUs) +{ + unsigned sub; + unsigned lastVCPU = firstVCPU + numVCPUs - 1; + unsigned firstSubset = firstVCPU / VCS_SUBSET_WIDTH; + unsigned lastSubset = lastVCPU / VCS_SUBSET_WIDTH; + unsigned lowMaskShift = firstVCPU % VCS_SUBSET_WIDTH; + unsigned highMaskShift = VCS_SUBSET_WIDTH - 1 - lastVCPU % VCS_SUBSET_WIDTH; + + ASSERT(firstSubset <= lastSubset && lastSubset < VCS_SUBSET_COUNT); + + VCPUSet_Empty(vcs); + for (sub = firstSubset; sub <= lastSubset; sub++) { + vcs->subset[sub] = CONST64U(-1); + } + vcs->subset[firstSubset] &= (CONST64U(-1) << lowMaskShift); + vcs->subset[lastSubset] &= (CONST64U(-1) >> highMaskShift); +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_Populate -- + * + * Populates the given set with the VCPUs in [0, numVCPUs). + * + *---------------------------------------------------------------------- + */ + +static INLINE void +VCPUSet_Populate(VCPUSet *vcs, unsigned numVCPUs) +{ + VCPUSet_PopulateRange(vcs, 0, numVCPUs); +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_Subset -- + * + * Return the specified subset of a VCPUSet. + * + *---------------------------------------------------------------------- + */ + +static INLINE uint64 +VCPUSet_Subset(const VCPUSet *vcs, + unsigned subset) +{ + ASSERT(subset < VCS_SUBSET_COUNT); + return vcs->subset[subset]; +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_SubsetPtr -- + * + * Return a pointer to the specified subset of a VCPUSet. + * + *---------------------------------------------------------------------- + */ + +static INLINE uint64 * +VCPUSet_SubsetPtr(VCPUSet *vcs, unsigned subset) +{ + ASSERT(subset < VCS_SUBSET_COUNT); + return &vcs->subset[subset]; +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_IsSupersetOrEqual -- + * + * Return TRUE iff vcs1 contains a superset of the VCPUs in vcs2 + * or vcs1 and vcs2 contain exactly the same VCPUs. + * + *---------------------------------------------------------------------- + */ + +static INLINE Bool +VCPUSet_IsSupersetOrEqual(const VCPUSet *vcs1, const VCPUSet *vcs2) +{ + FOR_EACH_SUBSET_IN_SET(idx) { + if (vcs2->subset[idx] & ~vcs1->subset[idx]) { + return FALSE; + } + } ROF_EACH_SUBSET_IN_SET(); + return TRUE; +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_IsSubsetOrEqual -- + * + * Return TRUE iff vcs1 contains a subset of the VCPUs in vcs2 + * or vcs1 and vcs2 contain exactly the same VCPUs. 
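VCPUSet_PopulateRange() above fills whole 64-bit subsets and then trims the first and last with boundary masks. A small self-check sketch under the two-subset layout; the function is illustrative only:

static void
ExamplePopulateRange(void)
{
   VCPUSet vcs;

   VCPUSet_PopulateRange(&vcs, 60, 8);                      /* VCPUs 60..67 */
   ASSERT(vcs.subset[0] == CONST64U(0xf000000000000000));   /* bits 60..63  */
   ASSERT(vcs.subset[1] == CONST64U(0x000000000000000f));   /* bits 0..3    */
}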
+ * + *---------------------------------------------------------------------- + */ + +static INLINE Bool +VCPUSet_IsSubsetOrEqual(const VCPUSet *vcs1, const VCPUSet *vcs2) +{ + return VCPUSet_IsSupersetOrEqual(vcs2, vcs1); +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_MakeSingleton -- + * + * Add a single Vcpuid to a VCPUSet and remove all others. + * + *---------------------------------------------------------------------- + */ + +static INLINE void +VCPUSet_MakeSingleton(VCPUSet *vcs, Vcpuid v) +{ + VCPUSet_Empty(vcs); + VCPUSet_Include(vcs, v); +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_IsSingleton -- + * + * Return TRUE iff vcs contains exactly one VCPU. + * + *---------------------------------------------------------------------- + */ + +static INLINE Bool +VCPUSet_IsSingleton(const VCPUSet *vcs) +{ + Bool foundOnce = FALSE; + FOR_EACH_SUBSET_IN_SET(idx) { + uint64 sub = vcs->subset[idx]; + if (sub != 0) { + if (foundOnce || (sub & (sub - 1)) != 0) { + return FALSE; + } + foundOnce = TRUE; + } + } ROF_EACH_SUBSET_IN_SET(); + return foundOnce; +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_IsFull -- + * + * Returns true iff vcs contains the set of all vcpus. + * + *---------------------------------------------------------------------- + */ +static INLINE Bool +VCPUSet_IsFull(const VCPUSet *vcs) +{ + return VCPUSet_Equals(vcs, VCPUSet_Full()); +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_AtomicReadWriteSubset -- + * + * For the nth aligned 64-VCPU subset of a VCPU set, atomically + * read then write. Return the contents read. Set 0 is VCPUs + * 0-63 and set 1 is VCPUs 64-127. + * + *---------------------------------------------------------------------- + */ + +static INLINE uint64 +VCPUSet_AtomicReadWriteSubset(VCPUSet *vcs, uint64 vcpus, + unsigned n) +{ + ASSERT(n < VCS_SUBSET_COUNT); + return Atomic_ReadWrite64(Atomic_VolatileToAtomic64(&vcs->subset[n]), + vcpus); +} + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_Size -- + * + * Return the number of VCPUs in this set. + * + *---------------------------------------------------------------------- + */ +static INLINE int +VCPUSet_Size(const VCPUSet *vcs) +{ + int n = 0; + FOR_EACH_SUBSET_IN_SET(idx) { + uint64 bits = vcs->subset[idx]; + while (bits != 0) { + bits = bits & (bits - 1); + n++; + } + } ROF_EACH_SUBSET_IN_SET(); + return n; +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_UnionSubset -- + * + * Given an 64-bit value and a subset number, add the VCPUs + * represented to the set. + * + *---------------------------------------------------------------------- + */ + +static INLINE void +VCPUSet_UnionSubset(VCPUSet *vcs, uint64 vcpus, unsigned n) +{ + ASSERT(n < VCS_SUBSET_COUNT); + vcs->subset[n] |= vcpus; +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_SubtractSubset -- + * + * Given an 64-bit value and a subset number, remove the VCPUs + * represented in the subset from the set. 
+ * + *---------------------------------------------------------------------- + */ + +static INLINE void +VCPUSet_SubtractSubset(VCPUSet *vcs, uint64 vcpus, unsigned n) +{ + ASSERT(n < VCS_SUBSET_COUNT); + vcs->subset[n] &= ~vcpus; +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_AtomicUnionSubset -- + * + * Given a 64-bit value and a subset number, atomically add + * the VCPUs represented to the set. + * + *---------------------------------------------------------------------- + */ + +static INLINE void +VCPUSet_AtomicUnionSubset(VCPUSet *vcs, uint64 vcpus, unsigned n) +{ + uint64 *subsetPtr = &vcs->subset[n]; + ASSERT(n < VCS_SUBSET_COUNT); + Atomic_Or64(Atomic_VolatileToAtomic64(subsetPtr), vcpus); +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_Invert -- + * + * Makes all non-present valid VCPUs in a set present and all + * VCPUs present non-present. + * + *---------------------------------------------------------------------- + */ + +static INLINE void +VCPUSet_Invert(VCPUSet *vcs) +{ + VCPUSet temp; + VCPUSet_Copy(&temp, VCPUSet_Full()); + VCPUSet_RemoveSet(&temp, vcs); + VCPUSet_Copy(vcs, &temp); +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_Intersection + * + * Given two VCPUSets, populate the destination set with only the + * VCPUs common to both. + * + *---------------------------------------------------------------------- + */ + +static INLINE void +VCPUSet_Intersection(VCPUSet *dest, const VCPUSet *src) +{ + FOR_EACH_SUBSET_IN_SET(idx) { + dest->subset[idx] &= src->subset[idx]; + } ROF_EACH_SUBSET_IN_SET(); +} + + +/* + *---------------------------------------------------------------------- + * + * VCPUSet_LogFormat -- + * + * Given a buffer of at least VCS_BUF_SIZE to fill, write into it a + * string suitable for use in Log() or LOG(). + * Returns the buffer which was passed as an argument, after + * writing the string. + * + *---------------------------------------------------------------------- + */ + +#ifdef VCS_SNPRINTF +static INLINE char * +VCPUSet_LogFormat(char *buf, const int size, const VCPUSet *vcs) +{ + int offset = 0; + Vcpuid highest = VCPUSet_FindLast(vcs); + int idx = (highest == VCPUID_INVALID) ? 0 : highest / 8; + ASSERT(size >= VCS_BUF_SIZE); +#define VCS_LOGF(...) \ + { \ + int ret = VCS_SNPRINTF(buf + offset, size - offset, __VA_ARGS__); \ + ASSERT(0 <= ret && ret < size - offset); \ + offset += ret; \ + } + /* Print the leading value with no zero-extension. */ + VCS_LOGF("%#x", ((unsigned char *)vcs)[idx--]); + + while (idx >= 0) { + if ((idx + 1) % (VCS_SUBSET_WIDTH / 8) == 0) { + VCS_LOGF("."); + } + VCS_LOGF("%02x", ((unsigned char *)vcs)[idx]); + idx--; + } + return buf; +} +#undef VCS_LOGF +#endif + + +#endif /* _VCPUSET_H_ */ diff --git a/vmmon-only/include/vcpuset_types.h b/vmmon-only/include/vcpuset_types.h new file mode 100644 index 00000000..bbb1990d --- /dev/null +++ b/vmmon-only/include/vcpuset_types.h @@ -0,0 +1,58 @@ +/********************************************************* + * Copyright (C) 2002-2013 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. 
+ * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * vcpuset_types.h -- + * + * ADT for a set of VCPUs. Implemented as an array of bitmasks. + * + */ + +#ifndef _VCPUSET_TYPES_H_ +#define _VCPUSET_TYPES_H_ + + +#define INCLUDE_ALLOW_VMX +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_USERLEVEL +#define INCLUDE_ALLOW_VMCORE +#include "includeCheck.h" + +#include "vm_basic_asm.h" +#include "vm_atomic.h" +#include "vcpuid.h" + +#define VCS_SUBSET_WIDTH 64 +#define VCS_SUBSET_SHIFT 6 +#define VCS_SUBSET_MASK ((CONST64U(1) << VCS_SUBSET_SHIFT) - 1) +#define VCS_SUBSET_COUNT 2 + +#define VCS_VCPUID_SUBSET_IDX(v) ((v) >> VCS_SUBSET_SHIFT) +#define VCS_VCPUID_SUBSET_BIT(v) (CONST64U(1) << ((v) & VCS_SUBSET_MASK)) + +/* + * If you update this type, you also need to update the SEND_IPI line in + * bora/public/iocontrolsMacosTable.h. + */ +typedef struct VCPUSet { + uint64 subset[VCS_SUBSET_COUNT]; +} VCPUSet; + +#endif diff --git a/vmmon-only/include/versioned_atomic.h b/vmmon-only/include/versioned_atomic.h new file mode 100644 index 00000000..7eb190d8 --- /dev/null +++ b/vmmon-only/include/versioned_atomic.h @@ -0,0 +1,170 @@ +/********************************************************* + * Copyright (C) 1998 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * Versioned atomic synchronization: + * + * These synchronization macros allow single-writer/many-reader + * access to data, based on Leslie Lamport's paper "Concurrent + * Reading and Writing", Communications of the ACM, November 1977. + * + * many-writer/many-reader can be implemented on top of versioned + * atomics by using an additional spin lock to synchronize + * writers. This is preferable for cases where readers are expected to + * greatly outnumber writers. + * + * Multiple concurrent writers to the version variables are not + * allowed. Even if writers are working on lock-free or disjoint + * data, the version counters are not interlocked for read-modify-write. + * + * Recursive use of versioned atomics in writers is currently not supported. 
+ */ + +#ifndef _VERSIONED_ATOMIC_H +#define _VERSIONED_ATOMIC_H + +#define INCLUDE_ALLOW_USERLEVEL +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_VMMON +#include "includeCheck.h" + +#include "vm_basic_asm.h" +#include "vm_assert.h" + +/* + * Users with attribute(packed) structs must ensure any + * VersionedAtomic members are marked as ALIGNED(4). Unfortunately + * the compiler cannot be trusted to align our substruct correctly + * (PR515329). If the enclosing struct is packed, the VersionedAtomic + * alignment requested below will be ignored! + */ + +typedef struct { + volatile uint32 v0; + volatile uint32 v1; +} ALIGNED(4) VersionedAtomic; + +/* + *----------------------------------------------------------------------------- + * + * VersionedAtomic_BeginWrite -- + * Called by a writer to indicate that the data protected by + * a given atomic version is about to change. Effectively locks out + * all readers until EndWrite is called. + * + * Results: + * . + * + * Side effects: + * + * + *----------------------------------------------------------------------------- + */ +static INLINE void +VersionedAtomic_BeginWrite(VersionedAtomic *versions) +{ + /* + * As long as the variable is on natural boundary it is guaranteed + * to be atomic, so we don't need to write from left to right as in + * Lamport's original algorithm. + */ + ASSERT(((size_t)(&versions->v0) & (sizeof(versions->v0) - 1)) == 0); + /* If recursive use is needed demand for support in PR514764 */ + ASSERT(versions->v1 == versions->v0); + versions->v0++; + COMPILER_MEM_BARRIER(); +} + +/* + *----------------------------------------------------------------------------- + * + * VersionedAtomic_EndWrite -- + * Called by a writer after it is done updating shared data. Lets + * pending and new readers proceed on shared data. + * + * Results: + * . + * + * Side effects: + * + * + *----------------------------------------------------------------------------- + */ +static INLINE void +VersionedAtomic_EndWrite(VersionedAtomic *versions) +{ + ASSERT(((size_t)(&versions->v1) & (sizeof(versions->v1) - 1)) == 0); + ASSERT(versions->v1 + 1 == versions->v0); + COMPILER_MEM_BARRIER(); + versions->v1 = versions->v0; +} + +/* + *----------------------------------------------------------------------------- + * + * VersionedAtomic_BeginTryRead -- + * Called by a reader before it tried to read shared data. + * + * Results: + * Returns a version number to the reader. This version number + * is required to confirm validity of the read operation when reader + * calls EndTryRead. + * + * Side effects: + * + * + *----------------------------------------------------------------------------- + */ +static INLINE uint32 +VersionedAtomic_BeginTryRead(const VersionedAtomic *versions) +{ + uint32 readVersion; + + readVersion = versions->v1; + COMPILER_MEM_BARRIER(); + + return readVersion; +} + +/* + *----------------------------------------------------------------------------- + * + * VersionedAtomic_EndTryRead -- + * Called by a reader after it finishes reading shared data, to confirm + * validity of the data that was just read (IOW, to make sure that a + * writer did not intervene while the read was in progress). + * + * Results: + * TRUE if the data read between BeginTryRead() and this call is + * valid. FALSE otherwise. 
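VersionedAtomic_BeginTryRead()/EndTryRead() above give the usual single-writer, retry-on-conflict read protocol. A hedged sketch of a reader loop; the SharedClock type and its fields are invented for illustration. The single writer would bracket its updates to the same fields with VersionedAtomic_BeginWrite()/EndWrite() on the same VersionedAtomic.

typedef struct SharedClock {
   VersionedAtomic vers;
   uint64 sec;
   uint64 nsec;
} SharedClock;

static INLINE uint64
ExampleReadClockNS(const SharedClock *clk)
{
   uint32 version;
   uint64 ns;

   do {
      version = VersionedAtomic_BeginTryRead(&clk->vers);
      ns = clk->sec * CONST64U(1000000000) + clk->nsec;
   } while (!VersionedAtomic_EndTryRead(&clk->vers, version));
   return ns;
}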
+ * + * Side effects: + * + * + *----------------------------------------------------------------------------- + */ +static INLINE Bool +VersionedAtomic_EndTryRead(const VersionedAtomic *versions, + uint32 readVersion) +{ + COMPILER_MEM_BARRIER(); + return LIKELY(versions->v0 == readVersion); +} + +#endif //_VERSIONED_ATOMIC_H diff --git a/vmmon-only/include/vm_asm.h b/vmmon-only/include/vm_asm.h new file mode 100644 index 00000000..0eb9cee5 --- /dev/null +++ b/vmmon-only/include/vm_asm.h @@ -0,0 +1,93 @@ +/********************************************************* + * Copyright (C) 1998-2014 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * vm_asm.h + * + * asm macros + */ + +#ifndef _VM_ASM_H_ +#define _VM_ASM_H_ + + +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_VMK_MODULE +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_DISTRIBUTE +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_USERLEVEL +#include "includeCheck.h" + +#ifdef VM_ARM_64 +#include "vm_asm_arm64.h" +#else + +#include "vm_basic_asm.h" +#include "x86msr.h" + +#ifdef VM_X86_64 +#include "vm_asm_x86_64.h" +#else +#include "vm_asm_x86.h" +#endif + + +static INLINE void +SET_FS64(uint64 fs64) +{ + __SET_MSR(MSR_FSBASE, fs64); +} + + +static INLINE void +SET_GS64(uint64 gs64) +{ + __SET_MSR(MSR_GSBASE, gs64); +} + +static INLINE void +SET_KernelGS64(uint64 kgs64) +{ + __SET_MSR(MSR_KERNELGSBASE, kgs64); +} + + +static INLINE uint64 +GET_FS64(void) +{ + return __GET_MSR(MSR_FSBASE); +} + + +static INLINE uint64 +GET_GS64(void) +{ + return __GET_MSR(MSR_GSBASE); +} + + +static INLINE uint64 +GET_KernelGS64(void) +{ + return __GET_MSR(MSR_KERNELGSBASE); +} + +#endif // VM_ARM_64 +#endif diff --git a/vmmon-only/include/vm_asm_x86.h b/vmmon-only/include/vm_asm_x86.h new file mode 100644 index 00000000..2b37976a --- /dev/null +++ b/vmmon-only/include/vm_asm_x86.h @@ -0,0 +1,998 @@ +/********************************************************* + * Copyright (C) 1998-2014 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. 
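SET_GS64()/GET_GS64() and friends above are thin wrappers around the segment-base MSRs. A hedged sketch of swapping in a new GS base and returning the old one; the helper is invented and assumes a context where writing MSR_GSBASE is permitted:

static INLINE uint64
ExampleSwapGSBase(uint64 newGsBase)
{
   uint64 old = GET_GS64();

   SET_GS64(newGsBase);
   return old;
}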
+ * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * vm_asm_x86.h + * + * IA32 asm macros + */ + +#ifndef _VM_ASM_X86_H_ +#define _VM_ASM_X86_H_ + + +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMK_MODULE +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_DISTRIBUTE +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_USERLEVEL +#include "includeCheck.h" + +#include "x86types.h" +#include "x86desc.h" +#include "x86sel.h" +#include "x86_basic_defs.h" +#include "x86msr.h" + +#ifdef VM_X86_64 +#define _GETSET_DTR_TYPE DTR64 +#else +#define _GETSET_DTR_TYPE DTR32 +#endif + +#ifdef __GNUC__ + +#if defined __APPLE__ +/* PR 352418: GCC produces error if the non-Apple version is used */ +#define ASSERT_ON_COMPILE_SELECTOR_SIZE(expr) +#else +/* ASSERT_ON_COMPILE_SELECTOR_SIZE: + * + * - Selector must be 16-bits. + * - If a constant is used, it better be only 16-bits. + * - If it's not a constant, it must be Selector-sized. or less. + * + * Although aesthetically the following looks nicer, gcc is unable + * to produce a constant expression for it: + * + * ASSERT_ON_COMPILE(sizeof(Selector) == 2 && \ + * ((__builtin_constant_p(expr) ? ((expr) >> 16) == 0) \ + * : sizeof(expr) <= 2) + */ +#if (__GNUC__ >= 4) && (__GNUC_MINOR__ >= 1) +#define ASSERT_ON_COMPILE_SELECTOR_SIZE(expr) \ + ASSERT_ON_COMPILE(sizeof(Selector) == 2 && \ + ((__builtin_constant_p(expr) && ((expr) >> 16) == 0) || \ + sizeof(expr) <= 2)) +#else +/* gcc 3.3.3 is not able to produce a constant expression (PR 356383) */ +#define ASSERT_ON_COMPILE_SELECTOR_SIZE(expr) +#endif +#endif + + +/* + * [GS]ET_[GI]DT() are defined as macros wrapping a function + * so we can pass the argument implicitly by reference (requires + * a macro) and get type checking too (requires a function). + */ + +#define SET_GDT(var) _Set_GDT(&(var)) + +/* Checked against the Intel manual and GCC --hpreg */ +static INLINE void +_Set_GDT(_GETSET_DTR_TYPE *dtr) +{ + __asm__( + "lgdt %0" + : + : "m" (*dtr) + ); +} + +#define SET_IDT(var) _Set_IDT(&(var)) + +/* Checked against the Intel manual and GCC --hpreg */ +static INLINE void +_Set_IDT(_GETSET_DTR_TYPE *dtr) +{ + __asm__( + "lidt %0" + : + : "m" (*dtr) + ); +} + +#define GET_GDT(var) _Get_GDT(&(var)) + +/* + * Checked against the Intel manual and GCC --hpreg + * volatile because there's a hidden input (the [IG]DTR) that can change + * without the compiler knowing it. + */ +static INLINE void +_Get_GDT(_GETSET_DTR_TYPE *dtr) +{ + __asm__ __volatile__( + "sgdt %0" + : "=m" (*dtr) + ); +} + +#define GET_IDT(var) _Get_IDT(&(var)) + +/* + * Checked against the Intel manual and GCC --hpreg + * volatile because the [IG]DT can change without the compiler knowing it + * (when we use l[ig]dt). + */ +static INLINE void +_Get_IDT(_GETSET_DTR_TYPE *dtr) +{ + __asm__ __volatile__( + "sidt %0" + : "=m" (*dtr) + ); +} + + +#define SET_LDT(expr) \ + do { \ + const Selector _set_ldt_sel = (Selector)(expr); \ + ASSERT_ON_COMPILE_SELECTOR_SIZE(expr); \ + /* lldt reads from the GDT; don't sink any writes. 
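GET_GDT()/SET_GDT() above pass their argument by reference through a one-line wrapper so the descriptor-table register is stored into, or loaded from, a _GETSET_DTR_TYPE in memory. A minimal save/restore sketch; the function name and the elided middle step are illustrative only:

static INLINE void
ExampleSaveRestoreGDT(void)
{
   _GETSET_DTR_TYPE hostGdt;

   GET_GDT(hostGdt);        /* sgdt into hostGdt */
   /* ... run with a different GDT here ... */
   SET_GDT(hostGdt);        /* lgdt to restore the saved base/limit */
}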
*/ \ + COMPILER_MEM_BARRIER(); \ + /* Checked against the Intel manual and GCC --hpreg */ \ + __asm__("lldt %0" \ + : \ + : "rm" (_set_ldt_sel)); \ + } while (0) + + +/* Checked against the Intel manual and GCC --hpreg + * + * volatile because the LDT can change without the compiler knowing it + * (when we use lldt). + */ +static INLINE void +_GET_LDT(Selector * const result) +{ + __asm__ __volatile__("sldt %0" + : "=rm" (*result)); +} + + +#define GET_LDT(var) \ + do { \ + _GET_LDT(&(var)); \ + } while (0) + + +/* Checked against the Intel manual and GCC --thutt */ +#define _BUILD_SET_R(func, reg) \ + static INLINE void \ + func(uintptr_t r) \ + { \ + __asm__("mov %0, %%" #reg \ + : /* no outputs */ \ + : "r" (r) \ + : "memory"); \ + } + +/* Not yet checked against the Intel manual and GCC --slava + * + * 'volatile' because CRs and DRs can change without the compiler + * knowing it (when there is a page fault, when a breakpoint occurs, + * and moreover it seems there is no way to teach gcc that smsw + * clobbers cr0 for example). + * + * The parameter is a 'uintptr_t *' so that the size of the actual + * parameter must exactly match the size of the hardware register. + * This prevents the use of 32-bit variables when building 64-bit + * code. + */ +#define _BUILD_GET_R(func, reg) \ + static INLINE void \ + func(uintptr_t *result) \ + { \ + __asm__ __volatile__("mov %%" #reg ", %0" \ + : "=r" (*result)); \ + } + +_BUILD_SET_R(_SET_CR0, cr0) +_BUILD_SET_R(_SET_CR2, cr2) +_BUILD_SET_R(_SET_CR3, cr3) +_BUILD_SET_R(_SET_CR4, cr4) +_BUILD_SET_R(_SET_CR8, cr8) + +_BUILD_GET_R(_GET_CR0, cr0) +_BUILD_GET_R(_GET_CR2, cr2) +_BUILD_GET_R(_GET_CR3, cr3) +_BUILD_GET_R(_GET_CR4, cr4) +_BUILD_GET_R(_GET_CR8, cr8) + +#if defined __APPLE__ +/* Mac OS gcc 4 uses DBx instead of DRx register names. 
*/ +_BUILD_SET_R(_SET_DR0, db0) +_BUILD_SET_R(_SET_DR1, db1) +_BUILD_SET_R(_SET_DR2, db2) +_BUILD_SET_R(_SET_DR3, db3) +_BUILD_SET_R(_SET_DR6, db6) +_BUILD_SET_R(_SET_DR7, db7) + +_BUILD_GET_R(_GET_DR0, db0) +_BUILD_GET_R(_GET_DR1, db1) +_BUILD_GET_R(_GET_DR2, db2) +_BUILD_GET_R(_GET_DR3, db3) +_BUILD_GET_R(_GET_DR6, db6) +_BUILD_GET_R(_GET_DR7, db7) +#else +_BUILD_SET_R(_SET_DR0, dr0) +_BUILD_SET_R(_SET_DR1, dr1) +_BUILD_SET_R(_SET_DR2, dr2) +_BUILD_SET_R(_SET_DR3, dr3) +_BUILD_SET_R(_SET_DR6, dr6) +_BUILD_SET_R(_SET_DR7, dr7) + +_BUILD_GET_R(_GET_DR0, dr0) +_BUILD_GET_R(_GET_DR1, dr1) +_BUILD_GET_R(_GET_DR2, dr2) +_BUILD_GET_R(_GET_DR3, dr3) +_BUILD_GET_R(_GET_DR6, dr6) +_BUILD_GET_R(_GET_DR7, dr7) +#endif + +#define SET_CR_DR(regType, regNum, expr) \ + do { \ + /* Ensure no implicit truncation of 'expr' */ \ + ASSERT_ON_COMPILE(sizeof(expr) <= sizeof(uintptr_t)); \ + _SET_##regType##regNum(expr); \ + } while (0) + +#define GET_CR_DR(regType, regNum, var) \ + do { \ + _GET_##regType##regNum(&(var)); \ + } while (0) + +#define SET_CR0(expr) SET_CR_DR(CR, 0, expr) +#define SET_CR2(expr) SET_CR_DR(CR, 2, expr) +#define SET_CR3(expr) SET_CR_DR(CR, 3, expr) +#define SET_CR4(expr) SET_CR_DR(CR, 4, expr) +#define SET_CR8(expr) SET_CR_DR(CR, 8, expr) + +/* Undefine GET_CR0; it is defined in mach_asm.h for SLES cross-compile */ +#undef GET_CR0 +#define GET_CR0(var) GET_CR_DR(CR, 0, var) +#define GET_CR2(var) GET_CR_DR(CR, 2, var) +#define GET_CR3(var) GET_CR_DR(CR, 3, var) +#define GET_CR4(var) GET_CR_DR(CR, 4, var) +#define GET_CR8(var) GET_CR_DR(CR, 8, var) + +#define SET_DR0(expr) SET_CR_DR(DR, 0, expr) +#define SET_DR1(expr) SET_CR_DR(DR, 1, expr) +#define SET_DR2(expr) SET_CR_DR(DR, 2, expr) +#define SET_DR3(expr) SET_CR_DR(DR, 3, expr) +#define SET_DR6(expr) SET_CR_DR(DR, 6, expr) +#define SET_DR7(expr) SET_CR_DR(DR, 7, expr) + +#define GET_DR0(var) GET_CR_DR(DR, 0, var) +#define GET_DR1(var) GET_CR_DR(DR, 1, var) +#define GET_DR2(var) GET_CR_DR(DR, 2, var) +#define GET_DR3(var) GET_CR_DR(DR, 3, var) +#define GET_DR6(var) GET_CR_DR(DR, 6, var) +#define GET_DR7(var) GET_CR_DR(DR, 7, var) + +#define SET_SEGREG(reg, expr) \ + do { \ + const Selector _set_segreg_sel = (Selector)(expr); \ + ASSERT_ON_COMPILE_SELECTOR_SIZE(expr); \ + /* mov to Sreg reads from the [GL]DT; don't sink any writes. */ \ + COMPILER_MEM_BARRIER(); \ + /* Checked against the Intel manual and GCC --hpreg */ \ + __asm__("movw %0, %%" #reg \ + : \ + : "rm" (_set_segreg_sel)); \ + } while (0) + +#define SET_DS(expr) SET_SEGREG(ds, expr) +#define SET_ES(expr) SET_SEGREG(es, expr) +#define SET_FS(expr) SET_SEGREG(fs, expr) +#define SET_GS(expr) SET_SEGREG(gs, expr) +#define SET_SS(expr) SET_SEGREG(ss, expr) + +/* Checked against the Intel manual and GCC --hpreg + * + * volatile because the content of CS can change without the compiler + * knowing it (when we use call gates). + * + * XXX: The segment register getter functions have not been updated to + * have stricter type checking like many other functions in this + * file because they return a value, rather than taking an + * argument. Perhaps sometime in the future, a willing soul will + * change these accessors to take an argument and at the same + * time install better type checking. 
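+ *
+ *      For illustration only, a hypothetical caller shows the two styles
+ *      side by side (GET_TR and the segment setters already take their
+ *      argument, which is what enables the stricter checking):
+ *
+ *         Selector ds = GET_DS();    // value-returning getter, weak checking
+ *         Selector tr;
+ *         GET_TR(tr);                // macro writes into its argument
+ *         SET_DS(ds);                // setter checks the selector size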
+ */ +#define _BUILD_GET_SEG(func, reg) \ + static INLINE Selector \ + func(void) \ + { \ + Selector result; \ + __asm__ __volatile__("movw %%" #reg ", %0" \ + : "=rm" (result)); \ + return result; \ + } + +_BUILD_GET_SEG(GET_CS, cs) +_BUILD_GET_SEG(GET_DS, ds) +_BUILD_GET_SEG(GET_ES, es) +_BUILD_GET_SEG(GET_FS, fs) +_BUILD_GET_SEG(GET_GS, gs) +_BUILD_GET_SEG(GET_SS, ss) + + +#define SET_TR(expr) \ + do { \ + const Selector _set_tr_sel = (Selector)(expr); \ + ASSERT_ON_COMPILE_SELECTOR_SIZE(expr); \ + /* ltr reads from the GDT; don't sink any writes. */ \ + COMPILER_MEM_BARRIER(); \ + /* Checked against the Intel manual and GCC --hpreg */ \ + __asm__ __volatile__("ltr %0" \ + : \ + : "rm" (_set_tr_sel) : "memory"); \ + } while (0) + +/* Checked against the Intel manual and GCC --hpreg + + volatile because the content of TR can change without the compiler knowing + it (when we use task gates). */ +static INLINE void +_GET_TR(Selector * const result) +{ + __asm__ __volatile__("str %0" + : "=rm" (*result)); +} + +#define GET_TR(var) \ + do { \ + _GET_TR(&(var)); \ + } while (0) + + +/* Checked against the Intel manual and GCC --hpreg + + We use this to restore interrupts, so this cannot be reordered around + by gcc */ +static INLINE void +_Set_flags(uintptr_t f) +{ + __asm__ __volatile__( + "push %0" "\n\t" + "popf" + : + : "g" (f) + : "memory", "cc" + ); +} + + + +/* Checked against the Intel manual and GCC --hpreg + + volatile because gcc 2.7.2.3 doesn't know when eflags are modified (it + seems to ignore the "cc" clobber). gcc 2.95.2 is ok: it optimize 2 + successive calls only if there is no instructions in between. */ +static INLINE uintptr_t +_Get_flags(void) +{ + uintptr_t result; + + __asm__ __volatile__( + "pushf" "\n\t" + "pop %0" + : "=rm" (result) + : + : "memory" + ); + + return result; +} + +#define SAVE_FLAGS(var) do { \ + var = _Get_flags(); \ +} while (0) + +static INLINE Bool +HwInterruptsEnabled(uint32 eflags) +{ + return (eflags & EFLAGS_IF) != 0; +} + +/* Checked against the Intel manual and GCC --hpreg */ +static INLINE void +CLTS(void) +{ + __asm__ __volatile__ ("clts"); +} + + +/* Beginning of the section whose correctness has NOT been checked */ +#define FNCLEX() __asm__("fnclex" ::); + +/* TLB_INVALIDATE_xxx are not checked yet */ +#define TLB_INVALIDATE_PAGE(_addr) do { \ + __asm__ __volatile__("invlpg %0": :"m" (*(char *) (_addr)):"memory"); \ +} while (0) + +#define TLB_INVALIDATE_PAGE_OFF_FS(_addr) do { \ + __asm__ __volatile__("fs; invlpg %0": :"m" (*(char *) (_addr)):"memory"); \ +} while (0) + +#if ! defined(VMKBOOT) +#define RESTORE_FLAGS _Set_flags +#define ENABLE_INTERRUPTS() __asm__ __volatile__ ("sti": : :"memory") +#define CLEAR_INTERRUPTS() __asm__ __volatile__ ("cli": : :"memory") +#endif + +#define RAISE_INTERRUPT(_x) __asm__ __volatile__("int %0" :: "g" (_x)) +#define RETURN_FROM_INT() __asm__ __volatile__("iret" :: ) + +#if ! defined(VMKERNEL) && ! 
defined(VMKBOOT) +#define NO_INTERRUPTS_BEGIN() do { \ + uintptr_t _flags; \ + SAVE_FLAGS(_flags); \ + CLEAR_INTERRUPTS(); + +#define NO_INTERRUPTS_END() RESTORE_FLAGS(_flags); \ + } while(0) +#endif + +/* End of the section whose correctness has NOT been checked */ + +#elif defined _MSC_VER /* !__GNUC__ */ + +#define SET_IDT(_idt) _Set_IDT(&(_idt)) +#define SET_GDT(_gdt) _Set_GDT(&(_gdt)) +#define SET_TR(_tr) _Set_TR(_tr) +#define SET_LDT(_tr) _Set_LDT(_tr) + +#define GET_IDT(_idt) _Get_IDT(&(_idt)) +#define GET_GDT(_gdt) _Get_GDT(&(_gdt)) +#define GET_TR(_tr) do { _tr = _Get_TR(); } while (0) +#define GET_LDT(_tr) do { _tr = _Get_LDT(); } while (0) + +#define GET_CR0(_reg) __asm mov eax, cr0 __asm mov _reg, eax +#define SET_CR0(_reg) __asm mov eax, _reg __asm mov cr0, eax +#define GET_CR2(_reg) __asm mov eax, cr2 __asm mov _reg, eax +#define SET_CR2(_reg) __asm mov eax, _reg __asm mov cr2, eax +#define GET_CR3(_reg) __asm mov eax, cr3 __asm mov _reg, eax +#define SET_CR3(_reg) __asm mov eax, _reg __asm mov cr3, eax +/* + * MSC doesn't seem to like CR4 in __asm statements. We emit + * the opcode for MOV EAX,CR4 = 0xf020e0 and MOV CR4,EAX = 0xf022e0 + */ +#define GET_CR4(_reg) { \ + __asm _emit 0x0f __asm _emit 0x20 __asm _emit 0xe0 \ + __asm mov _reg, eax \ +} +#define SET_CR4(_reg) { \ + __asm mov eax, _reg \ + __asm _emit 0x0f __asm _emit 0x22 __asm _emit 0xe0 \ +} + + +#define GET_DR0(_reg) do { __asm mov eax,dr0 __asm mov _reg,eax } while (0) +#define SET_DR0(_reg) do { __asm mov eax,_reg __asm mov dr0,eax } while (0) +#define GET_DR1(_reg) do { __asm mov eax,dr1 __asm mov _reg,eax } while (0) +#define SET_DR1(_reg) do { __asm mov eax,_reg __asm mov dr1,eax } while (0) +#define GET_DR2(_reg) do { __asm mov eax,dr2 __asm mov _reg,eax } while (0) +#define SET_DR2(_reg) do { __asm mov eax,_reg __asm mov dr2,eax } while (0) +#define GET_DR3(_reg) do { __asm mov eax,dr3 __asm mov _reg,eax } while (0) +#define SET_DR3(_reg) do { __asm mov eax,_reg __asm mov dr3,eax } while (0) +#define GET_DR6(_reg) do { __asm mov eax,dr6 __asm mov _reg,eax } while (0) +#define SET_DR6(_reg) do { __asm mov eax,_reg __asm mov dr6,eax } while (0) +#define GET_DR7(_reg) do { __asm mov eax,dr7 __asm mov _reg,eax } while (0) +#define SET_DR7(_reg) do { __asm mov eax,_reg __asm mov dr7,eax } while (0) + + +#define CLTS() __asm clts + +#define FNCLEX() __asm fnclex + +#define TLB_INVALIDATE_PAGE(_addr) { \ + void *_a = (_addr); \ + __asm mov eax, _a __asm invlpg [eax] \ +} + +#define TLB_INVALIDATE_PAGE_OFF_FS(_addr) { \ + uint32 __a = (uint32) (_addr); \ + __asm mov eax, __a _asm invlpg fs:[eax] \ +} + + +#define ENABLE_INTERRUPTS() { __asm sti } +#define CLEAR_INTERRUPTS() { __asm cli } + +#define RAISE_INTERRUPT(_x) {__asm int _x } +#define RETURN_FROM_INT() {__asm iretd } + + +#define SAVE_FLAGS(x) { \ + __asm pushfd __asm pop eax __asm mov x, eax \ +} + +#define RESTORE_FLAGS(x) { \ + __asm push x __asm popfd\ +} + + + +static INLINE void SET_DS(Selector val) +{ + __asm mov ax, val + __asm mov ds, ax +} + +static INLINE void SET_ES(Selector val) +{ + __asm mov ax, val + __asm mov es, ax +} + +static INLINE void SET_FS(Selector val) +{ + __asm mov ax, val + __asm mov fs, ax +} + +static INLINE void SET_GS(Selector val) +{ + __asm mov ax, val + __asm mov gs, ax +} + +static INLINE void SET_SS(Selector val) +{ + __asm mov ax, val + __asm mov ss, ax +} + +static INLINE Selector GET_FS(void) +{ + Selector _v; + __asm mov _v,fs + return _v; +} + +static INLINE Selector GET_GS(void) +{ + Selector _v; + __asm mov 
_v,gs + return _v; +} + + +static INLINE Selector GET_DS(void) +{ + Selector _v; + __asm mov _v,ds + return _v; +} + +static INLINE Selector GET_ES(void) +{ + Selector _v; + __asm mov _v,es + return _v; +} + +static INLINE Selector GET_SS(void) +{ + Selector _v; + __asm mov _v,ss + return _v; +} + +static INLINE Selector GET_CS(void) +{ + Selector _v; + __asm mov _v,cs + return _v; +} + +#pragma warning( disable : 4035) + +static INLINE uint32 GET_WORD_FROM_FS(uint32 *_addr) { + __asm mov eax, _addr + __asm mov eax, fs:[eax] +} + +static INLINE uint16 GET_SHORT_FROM_FS(uint16 *_addr) { + __asm mov eax, _addr + __asm mov ax, fs:[eax] +} + +static INLINE uint8 GET_BYTE_FROM_FS(uint8 *_addr) { + __asm mov eax, _addr + __asm mov al, fs:[eax] +} + +#pragma warning (default: 4035) + +static INLINE void SET_WORD_FS(uint32 *_addr, uint32 _val) { + __asm mov eax, _addr + __asm mov ebx, _val + __asm mov fs:[eax], ebx +} + +static INLINE void SET_SHORT_FS(uint32 *_addr, uint16 _val) { + __asm mov eax, _addr + __asm mov bx, _val + __asm mov fs:[eax], bx +} + +static INLINE void SET_BYTE_FS(uint32 *_addr, uint8 _val) { + __asm mov eax, _addr + __asm mov bl, _val + __asm mov fs:[eax], bl +} + +static INLINE void _Set_GDT(_GETSET_DTR_TYPE *dtr) { + __asm mov eax, dtr + __asm lgdt [eax] +} + +static INLINE void _Set_IDT(_GETSET_DTR_TYPE *dtr) { + __asm mov eax, dtr + __asm lidt [eax] +} + +static INLINE void _Set_LDT(Selector val) +{ + __asm lldt val +} + +static INLINE void _Set_TR(Selector val) +{ + __asm ltr val +} + +static INLINE void _Get_GDT(_GETSET_DTR_TYPE *dtr) { + __asm mov eax, dtr + __asm sgdt [eax] +} + +static INLINE void _Get_IDT(_GETSET_DTR_TYPE *dtr) { + __asm mov eax, dtr + __asm sidt [eax] +} + +static INLINE Selector _Get_LDT(void) { + Selector sel; + __asm sldt sel + return sel; +} + +static INLINE Selector _Get_TR(void) { + Selector sel; + __asm str sel + return sel; +} + + +static INLINE void +MEMCOPY_TO_FS(VA to, + char * from, + unsigned long n) +{ + unsigned long i =0; + while (i+4 <=n) { + uint32 x = *(uint32*) (from + i); + uint32 _faddr = (uint32) (to+i); + __asm mov eax, _faddr + __asm mov ebx, x + __asm mov fs:[eax], ebx + i +=4; + } + while (i> 32); + uint32 loval = (uint32)val; + __asm push edx + __asm push ecx + __asm push eax + __asm mov eax, loval + __asm mov edx, hival + __asm mov ecx, input + __asm _emit 0x0f __asm _emit 0x30 + __asm pop eax + __asm pop ecx + __asm pop edx +} +#pragma warning (default: 4035) +#else +#error +#endif + +#ifdef __GNUC__ +static INLINE void __SET_MSR(int cx, uint64 val) +{ +#ifdef VM_X86_64 + __asm__ __volatile__( + "wrmsr" + : /* no outputs */ + : "a" ((uint32) val), "d" ((uint32)(val >> 32)), "c" (cx) + ); +#else + __asm__ __volatile__( + "wrmsr" + : /* no outputs */ + : "A" (val), + "c" (cx) + ); +#endif +} +#endif + + +/* + * RDMSR/WRMSR access the 64bit MSRs as two + * 32 bit quantities, whereas GET_MSR/SET_MSR + * above access the MSRs as one 64bit quantity. 
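+ *
+ * For illustration, a hypothetical caller can read the same MSR through
+ * both interfaces (MSR_GSBASE is just an example register):
+ *
+ *    uint32 lo, hi;
+ *    uint64 whole = __GET_MSR(MSR_GSBASE);   // one 64-bit quantity
+ *    RDMSR(MSR_GSBASE, lo, hi);              // same MSR as two 32-bit halves
+ *    ASSERT(whole == QWORD(hi, lo));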
+ */ +#ifdef __GNUC__ +#undef RDMSR +#undef WRMSR +#define RDMSR(msrNum, low, high) do { \ + __asm__ __volatile__( \ + "rdmsr" \ + : "=a" (low), "=d" (high) \ + : "c" (msrNum) \ + ); \ +} while (0) + +#define WRMSR(msrNum, low, high) do { \ + __asm__ __volatile__( \ + "wrmsr" \ + : /* no outputs */ \ + : "c" (msrNum), \ + "a" (low), \ + "d" (high) \ + ); \ +} while (0) + +static INLINE uint64 RDPMC(int cx) +{ +#ifdef VM_X86_64 + uint64 pmcLow; + uint64 pmcHigh; + + __asm__ __volatile__( + "rdpmc" + : "=a" (pmcLow), "=d" (pmcHigh) + : "c" (cx) + ); + + return pmcHigh << 32 | pmcLow; +#else + uint64 pmc; + + __asm__ __volatile__( + "rdpmc" + : "=A" (pmc) + : "c" (cx) + ); + + return pmc; +#endif +} +#elif defined _MSC_VER +#ifndef VM_X86_64 // XXX Switch to intrinsics with the new 32 and 64-bit compilers. + +static INLINE uint64 RDPMC(int counter) +{ + __asm mov ecx, counter + __asm rdpmc +} + +static INLINE void WRMSR(uint32 msrNum, uint32 lo, uint32 hi) +{ + __asm mov ecx, msrNum + __asm mov eax, lo + __asm mov edx, hi + __asm wrmsr +} +#endif +#endif + + +#if defined(__GNUC__) && (defined(VMM) || defined(VMKERNEL) || defined(FROBOS)) +static INLINE uint64 __XGETBV(int cx) +{ +#ifdef VM_X86_64 + uint64 lowval, hival; + __asm__ __volatile__( +#if __GNUC__ < 4 || __GNUC__ == 4 && __GNUC_MINOR__ == 1 + ".byte 0x0f, 0x01, 0xd0" +#else + "xgetbv" +#endif + : "=a" (lowval), "=d" (hival) + : "c" (cx) + ); + return hival << 32 | lowval; +#else + uint64 val; + __asm__ __volatile__( +#if __GNUC__ < 4 || __GNUC__ == 4 && __GNUC_MINOR__ == 1 + ".byte 0x0f, 0x01, 0xd0" +#else + "xgetbv" +#endif + : "=A" (val) + : "c" (cx) + ); + return val; +#endif +} + +static INLINE void __XSETBV(int cx, uint64 val) +{ + __asm__ __volatile__( +#if __GNUC__ < 4 || __GNUC__ == 4 && __GNUC_MINOR__ == 1 + ".byte 0x0f, 0x01, 0xd1" +#else + "xsetbv" +#endif + : /* no outputs */ + : "a" ((uint32)val), "d" ((uint32)(val >> 32)), "c" (cx) + ); +} + +static INLINE uint64 GET_XCR0(void) +{ + return __XGETBV(0); +} + +#define SET_XCR0(val) __XSETBV(0, val) + +static INLINE void SET_XCR0_IF_NEEDED(uint64 newVal, uint64 oldVal) +{ + ASSERT(oldVal == GET_XCR0()); + if (newVal != oldVal) { + SET_XCR0(newVal); + } +} +#endif + + +#define START_TRACING() { \ + uintptr_t flags; \ + SAVE_FLAGS(flags); \ + flags |= EFLAGS_TF; \ + RESTORE_FLAGS(flags); \ +} + +#define STOP_TRACING() { \ + uintptr_t flags; \ + SAVE_FLAGS(flags); \ + flags &= ~EFLAGS_TF; \ + RESTORE_FLAGS(flags); \ +} + + +static INLINE Bool +INTERRUPTS_ENABLED(void) +{ + uintptr_t flags; + SAVE_FLAGS(flags); + return ((flags & EFLAGS_IF) != 0); +} + +static INLINE void +SET_KERNEL_PER_CORE(uint64 val) +{ + __SET_MSR(MSR_GSBASE, val); +} + +#endif diff --git a/vmmon-only/include/vm_asm_x86_64.h b/vmmon-only/include/vm_asm_x86_64.h new file mode 100644 index 00000000..902cd81b --- /dev/null +++ b/vmmon-only/include/vm_asm_x86_64.h @@ -0,0 +1,136 @@ +/********************************************************* + * Copyright (C) 1998-2014 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. 
+ * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * vm_asm_x86_64.h + * + * x86-64 asm macros + */ + +#ifndef _VM_ASM_X86_64_H_ +#define _VM_ASM_X86_64_H_ + + +#define INCLUDE_ALLOW_VMX +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_VMCORE +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMK_MODULE +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_DISTRIBUTE +#include "includeCheck.h" + +#ifdef __GNUC__ +#include "vm_asm_x86.h" +#endif + +/* + * This file contains inline assembly routines used by x86_64 code. + */ + +#ifdef __GNUC__ + + /* nop; prevents #error for no compiler definition from firing */ + +#elif defined _MSC_VER /* !__GNUC__ */ + +/* + * x86-64 windows doesn't support inline asm so we have to use these + * intrinsic functions defined in the compiler. Not all of these are well + * documented. There is an array in the compiler dll (c1.dll) which has + * an array of the names of all the intrinsics minus the leading + * underscore. Searching around in the ntddk.h file can also be helpful. + * + * The declarations for the intrinsic functions were taken from the DDK. + * Our declarations must match the ddk's otherwise the 64-bit c++ compiler + * will complain about second linkage of the intrinsic functions. + * We define the intrinsic using the basic types corresponding to the + * Windows typedefs. This avoids having to include windows header files + * to get to the windows types. + */ + +#ifdef _WIN64 +#ifdef __cplusplus +extern "C" { +#endif +unsigned __int64 __readmsr(unsigned long); +void __writemsr(unsigned long, unsigned __int64); +#pragma intrinsic(__readmsr, __writemsr) +#ifdef __cplusplus +} +#endif + + +static INLINE uint64 +RDPMC(int counter) +{ + return __readpmc(counter); +} + + +static INLINE void +WRMSR(uint32 msrNum, uint32 lo, uint32 hi) +{ + uint64 value = QWORD(hi, lo); + __writemsr(msrNum, value); +} + + +static INLINE uint64 +__GET_MSR(int input) +{ + return __readmsr((unsigned long)input); +} + + +static INLINE void +__SET_MSR(int cx, uint64 val) +{ + __writemsr((unsigned long)cx, (unsigned __int64)val); +} + +#endif + +#else +#error No compiler defined for get/set +#endif /* !__GNUC__ && !_MSC_VER */ + + +#ifdef __GNUC__ +static INLINE void +SWAPGS(void) +{ + __asm__ __volatile__("swapgs"); +} + + +static INLINE uint64 +RDTSCP_AuxOnly(void) +{ + uint64 tscLow, tscHigh, tscAux; + + __asm__ __volatile__( + "rdtscp" + : "=a" (tscLow), "=d" (tscHigh), "=c" (tscAux) + ); + + return tscAux; +} +#endif + +#endif diff --git a/vmmon-only/include/vm_assert.h b/vmmon-only/include/vm_assert.h new file mode 100644 index 00000000..b368e1da --- /dev/null +++ b/vmmon-only/include/vm_assert.h @@ -0,0 +1,336 @@ +/********************************************************* + * Copyright (C) 1998-2015 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. 
+ * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * vm_assert.h -- + * + * The basic assertion facility for all VMware code. + * + * For proper use, see bora/doc/assert and + * http://vmweb.vmware.com/~mts/WebSite/guide/programming/asserts.html. + */ + +#ifndef _VM_ASSERT_H_ +#define _VM_ASSERT_H_ + +#define INCLUDE_ALLOW_USERLEVEL + +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_VMKDRIVERS +#define INCLUDE_ALLOW_VMK_MODULE +#define INCLUDE_ALLOW_DISTRIBUTE +#define INCLUDE_ALLOW_VMCORE +#include "includeCheck.h" + +// XXX not necessary except some places include vm_assert.h improperly +#include "vm_basic_types.h" + +#ifdef __cplusplus +extern "C" { +#endif + +/* + * Some bits of vmcore are used in VMKernel code and cannot have + * the VMKERNEL define due to other header dependencies. + */ +#if defined(VMKERNEL) && !defined(VMKPANIC) +#define VMKPANIC 1 +#endif + +/* + * Internal macros, functions, and strings + * + * The monitor wants to save space at call sites, so it has specialized + * functions for each situation. User level wants to save on implementation + * so it uses generic functions. + */ + +#if !defined VMM || defined MONITOR_APP // { + +#if defined (VMKPANIC) +#include "vmk_assert.h" +#else /* !VMKPANIC */ +#define _ASSERT_PANIC(name) \ + Panic(_##name##Fmt "\n", __FILE__, __LINE__) +#define _ASSERT_PANIC_BUG(bug, name) \ + Panic(_##name##Fmt " bugNr=%d\n", __FILE__, __LINE__, bug) +#define _ASSERT_PANIC_NORETURN(name) \ + Panic(_##name##Fmt "\n", __FILE__, __LINE__) +#define _ASSERT_PANIC_BUG_NORETURN(bug, name) \ + Panic(_##name##Fmt " bugNr=%d\n", __FILE__, __LINE__, bug) +#endif /* VMKPANIC */ + +#endif // } + + +// These strings don't have newline so that a bug can be tacked on. +#define _AssertPanicFmt "PANIC %s:%d" +#define _AssertAssertFmt "ASSERT %s:%d" +#define _AssertVerifyFmt "VERIFY %s:%d" +#define _AssertNotImplementedFmt "NOT_IMPLEMENTED %s:%d" +#define _AssertNotReachedFmt "NOT_REACHED %s:%d" +#define _AssertMemAllocFmt "MEM_ALLOC %s:%d" +#define _AssertNotTestedFmt "NOT_TESTED %s:%d" + + +/* + * Panic and log functions + */ + +void Log(const char *fmt, ...) PRINTF_DECL(1, 2); +void Warning(const char *fmt, ...) PRINTF_DECL(1, 2); +#if defined VMKPANIC +void Panic_SaveRegs(void); + +#ifdef VMX86_DEBUG +void Panic_NoSave(const char *fmt, ...) PRINTF_DECL(1, 2); +#else +NORETURN void Panic_NoSave(const char *fmt, ...) PRINTF_DECL(1, 2); +#endif + +NORETURN void Panic_NoSaveNoReturn(const char *fmt, ...) PRINTF_DECL(1, 2); + +#define Panic(fmt...) do { \ + Panic_SaveRegs(); \ + Panic_NoSave(fmt); \ +} while(0) + +#define Panic_NoReturn(fmt...) do { \ + Panic_SaveRegs(); \ + Panic_NoSaveNoReturn(fmt); \ +} while(0) + +#else +NORETURN void Panic(const char *fmt, ...) PRINTF_DECL(1, 2); +#endif + +void LogThrottled(uint32 *count, const char *fmt, ...) PRINTF_DECL(2, 3); +void WarningThrottled(uint32 *count, const char *fmt, ...) PRINTF_DECL(2, 3); + + +#ifndef ASSERT_IFNOT + /* + * PR 271512: When compiling with gcc, catch assignments inside an ASSERT. + * + * 'UNLIKELY' is defined with __builtin_expect, which does not warn when + * passed an assignment (gcc bug 36050). 
To get around this, we put 'cond' + * in an 'if' statement and make sure it never gets executed by putting + * that inside of 'if (0)'. We use gcc's statement expression syntax to + * make ASSERT an expression because some code uses it that way. + * + * Since statement expression syntax is a gcc extension and since it's + * not clear if this is a problem with other compilers, the ASSERT + * definition was not changed for them. Using a bare 'cond' with the + * ternary operator may provide a solution. + */ + + #ifdef __GNUC__ + #define ASSERT_IFNOT(cond, panic) \ + ({if (UNLIKELY(!(cond))) { panic; if (0) { if (cond) {;}}} (void)0;}) + #else + #define ASSERT_IFNOT(cond, panic) \ + (UNLIKELY(!(cond)) ? (panic) : (void)0) + #endif +#endif + + +/* + * Assert, panic, and log macros + * + * Some of these are redefined below undef !VMX86_DEBUG. + * ASSERT() is special cased because of interaction with Windows DDK. + */ + +#if defined VMX86_DEBUG +#undef ASSERT +#define ASSERT(cond) ASSERT_IFNOT(cond, _ASSERT_PANIC(AssertAssert)) +#define ASSERT_BUG(bug, cond) \ + ASSERT_IFNOT(cond, _ASSERT_PANIC_BUG(bug, AssertAssert)) +#endif + +#undef VERIFY +#define VERIFY(cond) \ + ASSERT_IFNOT(cond, _ASSERT_PANIC_NORETURN(AssertVerify)) +#define VERIFY_BUG(bug, cond) \ + ASSERT_IFNOT(cond, _ASSERT_PANIC_BUG_NORETURN(bug, AssertVerify)) + +#define PANIC() _ASSERT_PANIC(AssertPanic) +#define PANIC_BUG(bug) _ASSERT_PANIC_BUG(bug, AssertPanic) + +#define ASSERT_NOT_IMPLEMENTED(cond) \ + ASSERT_IFNOT(cond, NOT_IMPLEMENTED()) +#define ASSERT_NOT_IMPLEMENTED_BUG(bug, cond) \ + ASSERT_IFNOT(cond, NOT_IMPLEMENTED_BUG(bug)) + +#if defined VMKPANIC || defined VMM +#define NOT_IMPLEMENTED() _ASSERT_PANIC_NORETURN(AssertNotImplemented) +#else +#define NOT_IMPLEMENTED() _ASSERT_PANIC(AssertNotImplemented) +#endif + +#if defined VMM +#define NOT_IMPLEMENTED_BUG(bug) \ + _ASSERT_PANIC_BUG_NORETURN(bug, AssertNotImplemented) +#else +#define NOT_IMPLEMENTED_BUG(bug) _ASSERT_PANIC_BUG(bug, AssertNotImplemented) +#endif + +#if defined VMKPANIC || defined VMM +#define NOT_REACHED() _ASSERT_PANIC_NORETURN(AssertNotReached) +#else +#define NOT_REACHED() _ASSERT_PANIC(AssertNotReached) +#endif + +#define ASSERT_MEM_ALLOC(cond) \ + ASSERT_IFNOT(cond, _ASSERT_PANIC(AssertMemAlloc)) + +#ifdef VMX86_DEVEL +#define ASSERT_DEVEL(cond) ASSERT(cond) +#define NOT_TESTED() Warning(_AssertNotTestedFmt "\n", __FILE__, __LINE__) +#else +#define ASSERT_DEVEL(cond) ((void)0) +#define NOT_TESTED() Log(_AssertNotTestedFmt "\n", __FILE__, __LINE__) +#endif + +#define ASSERT_NO_INTERRUPTS() ASSERT(!INTERRUPTS_ENABLED()) +#define ASSERT_HAS_INTERRUPTS() ASSERT(INTERRUPTS_ENABLED()) + +#define ASSERT_NOT_TESTED(cond) (UNLIKELY(!(cond)) ? NOT_TESTED() : (void)0) +#define NOT_TESTED_ONCE() DO_ONCE(NOT_TESTED()) + +#define NOT_TESTED_1024() \ + do { \ + static uint16 count = 0; \ + if (UNLIKELY(count == 0)) { NOT_TESTED(); } \ + count = (count + 1) & 1023; \ + } while (0) + +#define LOG_ONCE(_s) DO_ONCE(Log _s) + + +/* + * Redefine macros that are only in debug versions + */ + +#if !defined VMX86_DEBUG // { + +#undef ASSERT +#define ASSERT(cond) ((void)0) +#define ASSERT_BUG(bug, cond) ((void)0) + +/* + * Expand NOT_REACHED() as appropriate for each situation. + * + * Mainly, we want the compiler to infer the same control-flow + * information as it would from Panic(). Otherwise, different + * compilation options will lead to different control-flow-derived + * errors, causing some make targets to fail while others succeed. 
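+ *
+ * A purely illustrative caller that relies on this inference (the
+ * function and its cases are made up):
+ *
+ *    static int ModeToIndex(int mode)
+ *    {
+ *       switch (mode) {
+ *       case 0: return 10;
+ *       case 1: return 20;
+ *       }
+ *       NOT_REACHED();  // keeps "control reaches end of non-void function"
+ *    }                  // diagnostics consistent across build types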
+ * + * VC++ has the __assume() built-in function which we don't trust + * (see bug 43485); gcc has no such construct; we just panic in + * userlevel code. The monitor doesn't want to pay the size penalty + * (measured at 212 bytes for the release vmm for a minimal infinite + * loop; panic would cost even more) so it does without and lives + * with the inconsistency. + */ + +#if defined VMKPANIC || defined VMM +#undef NOT_REACHED +#if defined __GNUC__ && (__GNUC__ > 4 || __GNUC__ == 4 && __GNUC_MINOR__ >= 5) +#define NOT_REACHED() (__builtin_unreachable()) +#else +#define NOT_REACHED() ((void)0) +#endif +#else +// keep debug definition +#endif + +#undef LOG_UNEXPECTED +#define LOG_UNEXPECTED(bug) ((void)0) + +#undef ASSERT_NOT_TESTED +#define ASSERT_NOT_TESTED(cond) ((void)0) +#undef NOT_TESTED +#define NOT_TESTED() ((void)0) +#undef NOT_TESTED_ONCE +#define NOT_TESTED_ONCE() ((void)0) +#undef NOT_TESTED_1024 +#define NOT_TESTED_1024() ((void)0) + +#endif // !VMX86_DEBUG } + + +/* + * Compile-time assertions. + * + * ASSERT_ON_COMPILE does not use the common + * switch (0) { case 0: case (e): ; } trick because some compilers (e.g. MSVC) + * generate code for it. + * + * The implementation uses both enum and typedef because the typedef alone is + * insufficient; gcc allows arrays to be declared with non-constant expressions + * (even in typedefs, where it makes no sense). + * + * NOTE: if GCC ever changes so that it ignores unused types altogether, this + * assert might not fire! We explicitly mark it as unused because GCC 4.8+ + * uses -Wunused-local-typedefs as part of -Wall, which means the typedef will + * generate a warning. + */ + +#if defined(_Static_assert) || defined(__cplusplus) || \ + !defined(__GNUC__) || __GNUC__ < 4 || (__GNUC__ == 4 && __GNUC_MINOR__ < 6) +#define ASSERT_ON_COMPILE(e) \ + do { \ + enum { AssertOnCompileMisused = ((e) ? 1 : -1) }; \ + UNUSED_TYPE(typedef char AssertOnCompileFailed[AssertOnCompileMisused]); \ + } while (0) +#else +#define ASSERT_ON_COMPILE(e) \ + do { \ + _Static_assert(e, #e); \ + } while (0); +#endif + +/* + * To put an ASSERT_ON_COMPILE() outside a function, wrap it + * in MY_ASSERTS(). The first parameter must be unique in + * each .c file where it appears. For example, + * + * MY_ASSERTS(FS3_INT, + * ASSERT_ON_COMPILE(sizeof(FS3_DiskLock) == 128); + * ASSERT_ON_COMPILE(sizeof(FS3_DiskLockReserved) == DISK_BLOCK_SIZE); + * ASSERT_ON_COMPILE(sizeof(FS3_DiskBlock) == DISK_BLOCK_SIZE); + * ASSERT_ON_COMPILE(sizeof(Hardware_DMIUUID) == 16); + * ) + * + * Caution: ASSERT() within MY_ASSERTS() is silently ignored. + * The same goes for anything else not evaluated at compile time. + */ + +#define MY_ASSERTS(name, assertions) \ + static INLINE void name(void) { \ + assertions \ + } + +#ifdef __cplusplus +} /* extern "C" */ +#endif + +#endif /* ifndef _VM_ASSERT_H_ */ diff --git a/vmmon-only/include/vm_atomic.h b/vmmon-only/include/vm_atomic.h new file mode 100644 index 00000000..07f32eab --- /dev/null +++ b/vmmon-only/include/vm_atomic.h @@ -0,0 +1,3896 @@ +/********************************************************* + * Copyright (C) 1998-2015 VMware, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation version 2 and no later version. 
+ * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + * + *********************************************************/ + +/* + * vm_atomic.h -- + * + * Atomic power + * + * Note: Only partially tested on ARM processors: Works for View Open + * Client, which shouldn't have threads, and ARMv8 processors. + * + * In ARM, GCC intrinsics (__sync*) compile but might not + * work, while MS intrinsics (_Interlocked*) do not compile. + */ + +#ifndef _ATOMIC_H_ +#define _ATOMIC_H_ + +#define INCLUDE_ALLOW_USERLEVEL + +#define INCLUDE_ALLOW_MODULE +#define INCLUDE_ALLOW_VMMON +#define INCLUDE_ALLOW_VMKDRIVERS +#define INCLUDE_ALLOW_VMK_MODULE +#define INCLUDE_ALLOW_VMKERNEL +#define INCLUDE_ALLOW_DISTRIBUTE +#define INCLUDE_ALLOW_VMCORE +#include "includeCheck.h" + +#include "vm_basic_types.h" +#include "vm_assert.h" + +/* + * In the Atomic_* definitions below, memory ordering and atomicity are somewhat + * conflated in an inconsistent manner. First, we have Atomic_{Read,Write}, + * which only guarantees single copy atomicity, i.e. that the read/write occurs + * in an atomic fashion, but have no implication on memory ordering. The second + * class of Atomics are all the non-unfenced operations excluding + * Atomic_{Read,Write}*, which both imply atomicity and act as a memory barrier, + * implying sequentially consistent ordering of the atomic operation with all + * loads/stores prior to and after it. + * + * Since on x86, the second class of operations are associated with LOCK + * semantics, assumptions have been made about the ordering these operations + * imply on surrounding code (see for example the vmkernel's RefCount + * implementation). As a result, on arm64 we have to provide these same + * guarantees. We do this by making use of DMB barriers both before and after + * the atomic ldrx/strx sequences. A barrier before and after is required to + * avoid having part of the atomic operation reordered with surrounding code, + * e.g. a store-load reordering of the strx with a following load outside the + * Atomic_ op. For the first class of operations, Atomic_{Read,Write}, we do not + * implement a barrier. + * + * This implementation of Atomic operations is suboptimal on arm64, since + * both atomicity and memory ordering are fused together. Ideally the Atomic + * operations would only imply atomicity, and an explicit memory barrier in the + * surrounding code used to enforce ordering where necessary. This would eschew + * the need for the DMBs. A middle ground can be implemented where we use the + * arm64 load-acquire/store-release exclusive instructions to implement Atomics. + * This would imply sequential consistency of the Atomic operations (but not + * with any of the surrounding non-atomic operations) without the need for a + * DMB. Using these without a DMB today can still result in problematic + * reordering by the processor with surrounding non-atomic operations, e.g. a + * store-load reordering with a stlxr. Future optimization for arm64 should + * consider the wider change required at the call sites to minimize DMBs. 
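+ *
+ * As a purely illustrative sketch, that middle ground would swap the
+ * DMB + ldxr/stxr pattern used below for acquire/release exclusives,
+ * along the lines of:
+ *
+ *    1: ldaxr %w0, [%2]        // load-acquire exclusive
+ *       add   %w0, %w0, %w3
+ *       stlxr %w1, %w0, [%2]   // store-release exclusive
+ *       cbnz  %w1, 1b
+ *
+ * This is not what the macros below implement; they keep the explicit DMBs.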
+ * + * For further details on x86 and ARM memory ordering see + * https://wiki.eng.vmware.com/ARM/MemoryOrdering. + */ + +#ifdef VM_ARM_64 +#include "vm_basic_asm_arm64.h" + +#define ARM_64_ATOMIC_16_OPV_PRIVATE(atm,modval,op) ({ \ + uint32 _failed; \ + uint16 _sample; \ + __asm__ __volatile__ ( \ + "1: ldxrh %w0, [%2] \n\t" \ + #op " %w0, %w0, %w3 \n\t" \ + " stxrh %w1, %w0, [%2] \n\t" \ + " cbnz %w1, 1b \n\t" \ + : "=&r" (_sample), \ + "=&r" (_failed) \ + : "r" (atm), \ + "r" (modval) \ + : "memory"); \ +}) + +#define ARM_64_ATOMIC_16_OPO_PRIVATE(atm,modval,op) ({ \ + uint32 _failed; \ + uint16 _newval; \ + uint16 _oldval; \ + __asm__ __volatile__ ( \ + "1: ldxrh %w0, [%3] \n\t" \ + #op " %w1, %w0, %w4 \n\t" \ + " stxrh %w2, %w1, [%3] \n\t" \ + " cbnz %w2, 1b \n\t" \ + : "=&r" (_oldval), \ + "=&r" (_newval), \ + "=&r" (_failed) \ + : "r" (atm), \ + "r" (modval) \ + : "memory"); \ + _oldval; \ +}) + +#define ARM_64_ATOMIC_32_OPV_PRIVATE(atm,modval,op) ({ \ + uint32 _failed; \ + uint32 _sample; \ + __asm__ __volatile__ ( \ + "1: ldxr %w0, [%2] \n\t" \ + #op " %w0, %w0, %w3 \n\t" \ + " stxr %w1, %w0, [%2] \n\t" \ + " cbnz %w1, 1b \n\t" \ + : "=&r" (_sample), \ + "=&r" (_failed) \ + : "r" (atm), \ + "r" (modval) \ + : "memory"); \ +}) + +#define ARM_64_ATOMIC_32_OPO_PRIVATE(atm,modval,op) ({ \ + uint32 _failed; \ + uint32 _newval; \ + uint32 _oldval; \ + __asm__ __volatile__ ( \ + "1: ldxr %w0, [%3] \n\t" \ + #op " %w1, %w0, %w4 \n\t" \ + " stxr %w2, %w1, [%3] \n\t" \ + " cbnz %w2, 1b \n\t" \ + : "=&r" (_oldval), \ + "=&r" (_newval), \ + "=&r" (_failed) \ + : "r" (atm), \ + "r" (modval) \ + : "memory"); \ + _oldval; \ +}) + +#define ARM_64_ATOMIC_64_OPV_PRIVATE(atm,modval,op) ({ \ + uint32 _failed; \ + uint64 _sample; \ + __asm__ __volatile__ ( \ + "1: ldxr %x0, [%2] \n\t" \ + #op " %x0, %x0, %x3 \n\t" \ + " stxr %w1, %x0, [%2] \n\t" \ + " cbnz %w1, 1b \n\t" \ + : "=&r" (_sample), \ + "=&r" (_failed) \ + : "r" (atm), \ + "r" (modval) \ + : "memory"); \ +}) + +#define ARM_64_ATOMIC_64_OPO_PRIVATE(atm,modval,op) ({ \ + uint32 _failed; \ + uint64 _newval; \ + uint64 _oldval; \ + __asm__ __volatile__ ( \ + "1: ldxr %x0, [%3] \n\t" \ + #op " %x1, %x0, %x4 \n\t" \ + " stxr %w2, %x1, [%3] \n\t" \ + " cbnz %w2, 1b \n\t" \ + : "=&r" (_oldval), \ + "=&r" (_newval), \ + "=&r" (_failed) \ + : "r" (atm), \ + "r" (modval) \ + : "memory"); \ + _oldval; \ +}) + +#define ARM_64_ATOMIC_16_OPV_PRIVATE_FENCED(atm,modval,op) ({ \ + DMB(); \ + ARM_64_ATOMIC_16_OPV_PRIVATE(atm,modval,op); \ + DMB(); \ +}) + +#define ARM_64_ATOMIC_16_OPO_PRIVATE_FENCED(atm,modval,op) ({ \ + uint16 _oldval_fenced; \ + DMB(); \ + _oldval_fenced = ARM_64_ATOMIC_16_OPO_PRIVATE(atm,modval,op); \ + DMB(); \ + _oldval_fenced; \ +}) + +#define ARM_64_ATOMIC_32_OPV_PRIVATE_FENCED(atm,modval,op) ({ \ + DMB(); \ + ARM_64_ATOMIC_32_OPV_PRIVATE(atm,modval,op); \ + DMB(); \ +}) + +#define ARM_64_ATOMIC_32_OPO_PRIVATE_FENCED(atm,modval,op) ({ \ + uint32 _oldval_fenced; \ + DMB(); \ + _oldval_fenced = ARM_64_ATOMIC_32_OPO_PRIVATE(atm,modval,op); \ + DMB(); \ + _oldval_fenced; \ +}) + +#define ARM_64_ATOMIC_64_OPV_PRIVATE_FENCED(atm,modval,op) ({ \ + DMB(); \ + ARM_64_ATOMIC_64_OPV_PRIVATE(atm,modval,op); \ + DMB(); \ +}) + +#define ARM_64_ATOMIC_64_OPO_PRIVATE_FENCED(atm,modval,op) ({ \ + uint64 _oldval_fenced; \ + DMB(); \ + _oldval_fenced = ARM_64_ATOMIC_64_OPO_PRIVATE(atm,modval,op); \ + DMB(); \ + _oldval_fenced; \ +}) + +#endif /* VM_ARM_64 */ + + +/* Basic atomic types: 16, 32 and 64 bits */ +typedef struct Atomic_uint16 { + volatile uint16 
value; +} Atomic_uint16 ALIGNED(2); + +typedef struct Atomic_uint32 { + volatile uint32 value; +} Atomic_uint32 ALIGNED(4); + +typedef struct Atomic_uint64 { + volatile uint64 value; +} Atomic_uint64 ALIGNED(8); + +/* + * Prototypes for msft atomics. These are defined & inlined by the + * compiler so no function definition is needed. The prototypes are + * needed for C++. Since amd64 compiler doesn't support inline asm we + * have to use these. Unfortunately, we still have to use some inline asm + * for the 32 bit code since the and/or/xor implementations didn't show up + * until XP or 2k3. + * + * The declarations for the intrinsic functions were taken from ntddk.h + * in the DDK. The declarations must match otherwise the 64-bit C++ + * compiler will complain about second linkage of the intrinsic functions. + * We define the intrinsic using the basic types corresponding to the + * Windows typedefs. This avoids having to include windows header files + * to get to the windows types. + */ +#if defined(_MSC_VER) && _MSC_VER >= 1310 && !defined(BORA_NO_WIN32_INTRINS) +#ifdef __cplusplus +extern "C" { +#endif +long _InterlockedExchange(long volatile*, long); +long _InterlockedCompareExchange(long volatile*, long, long); +long _InterlockedExchangeAdd(long volatile*, long); +long _InterlockedDecrement(long volatile*); +long _InterlockedIncrement(long volatile*); +void _ReadWriteBarrier(void); +#pragma intrinsic(_InterlockedExchange, _InterlockedCompareExchange) +#pragma intrinsic(_InterlockedExchangeAdd, _InterlockedDecrement) +#pragma intrinsic(_InterlockedIncrement, _ReadWriteBarrier) + +# if _MSC_VER >= 1600 +char _InterlockedExchange8(char volatile *, char); +char _InterlockedCompareExchange8(char volatile *, char, char); +#pragma intrinsic(_InterlockedCompareExchange8, _InterlockedCompareExchange8) +#endif + +#if defined(VM_X86_64) +long _InterlockedAnd(long volatile*, long); +__int64 _InterlockedAnd64(__int64 volatile*, __int64); +long _InterlockedOr(long volatile*, long); +__int64 _InterlockedOr64(__int64 volatile*, __int64); +long _InterlockedXor(long volatile*, long); +__int64 _InterlockedXor64(__int64 volatile*, __int64); +__int64 _InterlockedExchangeAdd64(__int64 volatile*, __int64); +__int64 _InterlockedIncrement64(__int64 volatile*); +__int64 _InterlockedDecrement64(__int64 volatile*); +__int64 _InterlockedExchange64(__int64 volatile*, __int64); +__int64 _InterlockedCompareExchange64(__int64 volatile*, __int64, __int64); +#if !defined(_WIN64) +#pragma intrinsic(_InterlockedAnd, _InterlockedAnd64) +#pragma intrinsic(_InterlockedOr, _InterlockedOr64) +#pragma intrinsic(_InterlockedXor, _InterlockedXor64) +#pragma intrinsic(_InterlockedExchangeAdd64, _InterlockedIncrement64) +#pragma intrinsic(_InterlockedDecrement64, _InterlockedExchange64) +#pragma intrinsic(_InterlockedCompareExchange64) +#endif /* !_WIN64 */ +#endif /* __x86_64__ */ + +#ifdef __cplusplus +} +#endif +#endif /* _MSC_VER */ + +#if defined(__arm__) +/* + * LDREX without STREX or CLREX may cause problems in environments where the + * context switch may not clear the reference monitor - according ARM manual + * the reference monitor should be cleared after a context switch, but some + * may not like Linux kernel's non-preemptive context switch path. So use of + * ARM routines in kernel code may not be safe. 
+ */ +# if defined(__ARM_ARCH_7__) || defined(__ARM_ARCH_7A__) || \ + defined(__ARM_ARCH_7R__)|| defined(__ARM_ARCH_7M__) +# define VM_ARM_V7 +# ifdef __KERNEL__ +# warning LDREX/STREX may not be safe in linux kernel, since it \ + does not issue CLREX on context switch (as of 2011-09-29). +# endif +# else +# error Only ARMv7 extends the synchronization primitives ldrex/strex. \ + For the lower ARM version, please implement the atomic functions \ + by kernel APIs. +# endif +#endif + +/* Data Memory Barrier */ +#ifdef VM_ARM_V7 +#define dmb() __asm__ __volatile__("dmb" : : : "memory") +#endif + + +/* Convert a volatile uint32 to Atomic_uint32. */ +static INLINE Atomic_uint32 * +Atomic_VolatileToAtomic(volatile uint32 *var) // IN: +{ + return (Atomic_uint32 *)var; +} + +/* Convert a volatile uint64 to Atomic_uint64. */ +static INLINE Atomic_uint64 * +Atomic_VolatileToAtomic64(volatile uint64 *var) // IN: +{ + return (Atomic_uint64 *)var; +} + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Init, Atomic_SetFence, AtomicUseFence -- + * + * Determine whether an lfence intruction is executed after + * every locked instruction. + * + * Certain AMD processors have a bug (see bug 107024) that + * requires an lfence after every locked instruction. + * + * The global variable AtomicUseFence controls whether lfence + * is used (see AtomicEpilogue). + * + * Atomic_SetFence sets AtomicUseFence to the given value. + * + * Atomic_Init computes and sets AtomicUseFence for x86. + * It does not take into account the number of processors. + * + * The rationale for all this complexity is that Atomic_Init + * is the easy-to-use interface. It can be called a number + * of times cheaply, and does not depend on other libraries. + * However, because the number of CPUs is difficult to compute, + * it does without it and always assumes there are more than one. + * + * For programs that care or have special requirements, + * Atomic_SetFence can be called directly, in addition to Atomic_Init. + * It overrides the effect of Atomic_Init, and can be called + * before, after, or between calls to Atomic_Init. + * + *----------------------------------------------------------------------------- + */ + +// The freebsd assembler doesn't know the lfence instruction +#if defined(__GNUC__) && \ + __GNUC__ >= 3 && \ + (defined(__VMKERNEL__) || !defined(__FreeBSD__)) && \ + (!defined(MODULE) || defined(__VMKERNEL_MODULE__)) && \ + !defined(__APPLE__) && \ + (defined(__i386__) || defined(__x86_64__)) /* PR136775 */ +#define ATOMIC_USE_FENCE +#endif + +/* + * Starting with vSphere 2014, we no longer support ESX on AMD Rev F. + * Thus, we can eliminate all dynamic checks for whether to enable + * the Errata 147 work-around when compiling many of our binaries. + * However, we use an opt-in approach here rather than assuming all + * parts of our builds are safe. For example, the "fdm" binary from + * a new build may time travel back to hosts running older versions + * of ESX on Rev F, so "fdm" continues to require the ability to + * dynamically enable the errata work-around. With vSphere 2017, + * this will no longer be required as the oldest version of ESX that + * VC 2017 will support is ESX 2014 (which won't run on Rev F). + * + * Modules may explicitly define MAY_NEED_AMD_REVF_WORKAROUND as 0 prior to + * inclusion of vm_atomic.h when they are safe on AMD Rev F with the elided + * lfence. 
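+ *
+ * For example, such a module would simply compile with:
+ *
+ *    #define MAY_NEED_AMD_REVF_WORKAROUND 0
+ *    #include "vm_atomic.h"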
+ */ +#if !defined(MAY_NEED_AMD_REVF_WORKAROUND) +#if (!defined(VMX86_SERVER) || \ + (!defined(VMX86_VMX) && !defined(VMKERNEL) && \ + !defined(VMM) && !defined(VMCORE))) +#define MAY_NEED_AMD_REVF_WORKAROUND 1 +#else +#define MAY_NEED_AMD_REVF_WORKAROUND 0 +#endif +#endif + +#if MAY_NEED_AMD_REVF_WORKAROUND +#if defined(VMATOMIC_IMPORT_DLLDATA) +VMX86_EXTERN_DATA Bool AtomicUseFence; +#else +EXTERN Bool AtomicUseFence; +#endif +EXTERN Bool atomicFenceInitialized; +#else /* MAY_NEED_AMD_REVF_WORKAROUND */ +#define AtomicUseFence FALSE +#define atomicFenceInitialized TRUE +#endif /* MAY_NEED_AMD_REVF_WORKAROUND */ + + +void AtomicInitFence(void); + +static INLINE void +Atomic_Init(void) +{ +#ifdef ATOMIC_USE_FENCE + if (MAY_NEED_AMD_REVF_WORKAROUND && !atomicFenceInitialized) { + AtomicInitFence(); + } +#endif +} + +static INLINE void +Atomic_SetFence(Bool fenceAfterLock) // IN: +{ + (void)fenceAfterLock; /* Work around unused parameter. */ +#if MAY_NEED_AMD_REVF_WORKAROUND + AtomicUseFence = fenceAfterLock; + atomicFenceInitialized = TRUE; +#endif +} + + +/* Conditionally execute fence after interlocked instruction. */ +static INLINE void +AtomicEpilogue(void) +{ +#if MAY_NEED_AMD_REVF_WORKAROUND && defined(ATOMIC_USE_FENCE) +#ifdef VMM + /* The monitor conditionally patches out the lfence when not needed.*/ + /* Construct a MonitorPatchTextEntry in the .patchtext section. */ + asm volatile ("1:\n\t" + "lfence\n\t" + "2:\n\t" + ".pushsection .patchtext\n\t" + ".quad 1b\n\t" + ".quad 2b\n\t" + ".quad 0\n\t" + ".popsection\n\t" ::: "memory"); +#else + if (UNLIKELY(AtomicUseFence)) { + asm volatile ("lfence" ::: "memory"); + } +#endif +#endif +} + + +/* + * All the assembly code is tricky and written conservatively. + * For example, to make sure gcc won't introduce copies, + * we force the addressing mode like this: + * + * "xchgl %0, (%1)" + * : "=r" (val) + * : "r" (&var->value), + * "0" (val) + * : "memory" + * + * - edward + * + * Actually - turns out that gcc never generates memory aliases (it + * still does generate register aliases though), so we can be a bit + * more agressive with the memory constraints. The code above can be + * modified like this: + * + * "xchgl %0, %1" + * : "=r" (val), + * "=m" (var->value), + * : "0" (val), + * "1" (var->value) + * + * The advantages are that gcc can use whatever addressing mode it + * likes to access the memory value, and that we dont have to use a + * way-too-generic "memory" clobber as there is now an explicit + * declaration that var->value is modified. + * + * see also /usr/include/asm/atomic.h to convince yourself this is a + * valid optimization. + * + * - walken + */ + +#if defined(_MSC_VER) && _MSC_VER < 1600 && defined(__x86_64__) +Bool VMWInterlockedExchangeBool(Bool volatile *ptr, + Bool val); + +Bool VMWInterlockedCompareExchangeBool(Bool volatile *ptr, + Bool newVal, + Bool oldVal); +#endif + +typedef struct Atomic_Bool { + volatile Bool value; +} Atomic_Bool; + +/* The ARM team can come along and add the code real soon now */ +extern Bool AtomicUndefinedOnARM(void); + +/* + *----------------------------------------------------------------------------- + * + * Atomic_ReadBool -- + * + * Read the value of the specified object atomically. + * + * Results: + * The value of the atomic variable. + * + * Side effects: + * None. 
+ * + *----------------------------------------------------------------------------- + */ + +static INLINE Bool +Atomic_ReadBool(Atomic_Bool const *var) // IN: +{ + Bool val; + +#if defined(__GNUC__) && (defined(VM_ARM_32) || defined(VM_ARM_64)) + val = AtomicUndefinedOnARM(); +#elif defined(__GNUC__) && (defined(__i386__) || defined(__x86_64__)) + __asm__ __volatile__( + "movb %1, %0" + : "=q" (val) + : "m" (var->value) + ); +#elif defined(_MSC_VER) + val = var->value; +#else +#error No compiler defined for Atomic_ReadBool +#endif + + return val; +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_ReadWriteBool -- + * + * Read followed by write. + * + * Results: + * The value of the atomic variable before the write. + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE Bool +Atomic_ReadWriteBool(Atomic_Bool *var, // IN/OUT: + Bool val) // IN: +{ +#if defined(__GNUC__) && (defined(VM_ARM_32) || defined(VM_ARM_64)) + return AtomicUndefinedOnARM(); +#elif defined(__GNUC__) && (defined(__i386__) || defined(__x86_64__)) + __asm__ __volatile__( + "xchgb %0, %1" + : "=q" (val), + "+m" (var->value) + : "0" (val) + ); + AtomicEpilogue(); + return val; +#elif defined(_MSC_VER) && _MSC_VER >= 1600 + return _InterlockedExchange8(&var->value, val); +#elif defined(_MSC_VER) && defined(__i386__) +#pragma warning(push) +#pragma warning(disable : 4035) // disable no-return warning + { + __asm movzx eax, val + __asm mov ebx, var + __asm xchg [ebx]Atomic_Bool.value, al + } +#pragma warning(pop) +#elif defined(_MSC_VER) && defined(__x86_64__) + return VMWInterlockedExchangeBool(&var->value, val); +#else +#error No compiler defined for Atomic_ReadBool +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_WriteBool -- + * + * Write the specified value to the specified object atomically. + * + * Results: + * None. + * + * Side effects: + * None. + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_WriteBool(Atomic_Bool *var, // IN/OUT: + Bool val) // IN: +{ +#if defined(__GNUC__) && (defined(VM_ARM_32) || defined(VM_ARM_64)) + AtomicUndefinedOnARM(); +#elif defined(__GNUC__) && (defined(__i386__) || defined(__x86_64__)) + __asm__ __volatile__( + "movb %1, %0" + : "=m" (var->value) + : "qn" (val) + ); +#elif defined(_MSC_VER) + var->value = val; +#else +#error No compiler defined for Atomic_WriteBool +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_ReadIfEqualWriteBool -- + * + * Compare exchange: Read variable, if equal to oldVal, write newVal. + * + * Results: + * The value of the atomic variable before the write. + * + * Side effects: + * The variable may be modified. 
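+ *
+ *      For example, an illustrative try-lock can be built on this
+ *      primitive ("lck" is a hypothetical Atomic_Bool):
+ *
+ *         if (Atomic_ReadIfEqualWriteBool(&lck, FALSE, TRUE) == FALSE) {
+ *            // we observed FALSE and wrote TRUE, so the "lock" is ours
+ *         }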
+ * + *----------------------------------------------------------------------------- + */ + +static INLINE Bool +Atomic_ReadIfEqualWriteBool(Atomic_Bool *var, // IN/OUT: + Bool oldVal, // IN: + Bool newVal) // IN: +{ +#if defined(__GNUC__) && (defined(VM_ARM_32) || defined(VM_ARM_64)) + return AtomicUndefinedOnARM(); +#elif defined(__GNUC__) && (defined(__i386__) || defined(__x86_64__)) + Bool val; + + __asm__ __volatile__( + "lock; cmpxchgb %2, %1" + : "=a" (val), + "+m" (var->value) + : "q" (newVal), + "0" (oldVal) + : "cc" + ); + AtomicEpilogue(); + return val; +#elif defined(_MSC_VER) && _MSC_VER >= 1600 + return _InterlockedCompareExchange8(&var->value, newVal, oldVal); +#elif defined(_MSC_VER) && defined(__i386__) +#pragma warning(push) +#pragma warning(disable : 4035) // disable no-return warning + { + __asm mov al, oldVal + __asm mov ebx, var + __asm mov cl, newVal + __asm lock cmpxchg [ebx]Atomic_Bool.value, cl + __asm movzx eax, al + // eax is the return value, this is documented to work - edward + } +#pragma warning(pop) +#elif defined(_MSC_VER) && defined(__x86_64__) + return VMWInterlockedCompareExchangeBool(&var->value, newVal, oldVal); +#else +#error No compiler defined for Atomic_ReadIfEqualWriteBool +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Read -- + * + * Read + * + * Results: + * The value of the atomic variable. + * + * Side effects: + * None. + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint32 +Atomic_Read(Atomic_uint32 const *var) // IN +{ + uint32 value; + +#if defined(VMM) + ASSERT(((uintptr_t)var % 4) == 0); +#endif + +#if defined(__GNUC__) + /* + * Use inline assembler to force using a single load instruction to + * ensure that the compiler doesn't split a transfer operation into multiple + * instructions. + */ + +#if defined(VM_ARM_32) + __asm__ __volatile__( + "ldr %0, [%1]" + : "=r" (value) + : "r" (&var->value) + ); +#elif defined(VM_ARM_64) + __asm__ __volatile__ ( + "ldr %w0, [%1]" + : "=r" (value) + : "r" (&var->value) + ); +#else + __asm__ __volatile__( + "mov %1, %0" + : "=r" (value) + : "m" (var->value) + ); +#endif +#elif defined(_MSC_VER) + /* + * Microsoft docs guarantee simple reads and writes to properly + * aligned 32-bit variables use only a single instruction. + * http://msdn.microsoft.com/en-us/library/ms684122%28VS.85%29.aspx + */ + + value = var->value; +#else +#error No compiler defined for Atomic_Read +#endif + + return value; +} +#define Atomic_Read32 Atomic_Read + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_ReadWrite -- + * + * Read followed by write + * + * Results: + * The value of the atomic variable before the write. 
+ * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint32 +Atomic_ReadWrite(Atomic_uint32 *var, // IN/OUT + uint32 val) // IN +{ +#if defined(__GNUC__) +#ifdef VM_ARM_V7 + register volatile uint32 retVal; + register volatile uint32 res; + + dmb(); + + __asm__ __volatile__( + "1: ldrex %[retVal], [%[var]] \n\t" + "strex %[res], %[val], [%[var]] \n\t" + "teq %[res], #0 \n\t" + "bne 1b" + : [retVal] "=&r" (retVal), [res] "=&r" (res) + : [var] "r" (&var->value), [val] "r" (val) + : "cc" + ); + + dmb(); + + return retVal; +#elif defined(VM_ARM_64) + register uint32 retVal; + register uint32 failed; + + __asm__ __volatile__( + " dmb sy \n\t" + "1: ldxr %w0, [%2] \n\t" + " stxr %w1, %w3, [%2] \n\t" + " cbnz %w1, 1b \n\t" + " dmb sy \n\t" + : "=&r" (retVal), "=&r" (failed) + : "r" (&var->value), "r" (val) + : "memory" + ); + + return retVal; +#else /* VM_X86_ANY */ + /* Checked against the Intel manual and GCC --walken */ + __asm__ __volatile__( + "xchgl %0, %1" + : "=r" (val), + "+m" (var->value) + : "0" (val) + ); + AtomicEpilogue(); + return val; +#endif /* VM_X86_ANY */ +#elif defined _MSC_VER +#if _MSC_VER >= 1310 + return _InterlockedExchange((long *)&var->value, (long)val); +#else +#pragma warning(push) +#pragma warning(disable : 4035) // disable no-return warning + { + __asm mov eax, val + __asm mov ebx, var + __asm xchg [ebx]Atomic_uint32.value, eax + // eax is the return value, this is documented to work - edward + } +#pragma warning(pop) +#endif // _MSC_VER >= 1310 +#else +#error No compiler defined for Atomic_ReadWrite +#endif // __GNUC__ +} +#define Atomic_ReadWrite32 Atomic_ReadWrite + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Write -- + * + * Write + * + * Results: + * None. + * + * Side effects: + * None. + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Write(Atomic_uint32 *var, // OUT + uint32 val) // IN +{ +#if defined(VMM) + ASSERT(((uintptr_t)var % 4) == 0); +#endif + +#if defined(__GNUC__) +#if defined(VM_ARM_ANY) + /* + * A3.4.1 ARM DDI 0406C: + * + * When a processor writes using any instruction other than a + * Store-Exclusive: + * + * - if the write is to a physical address that is not covered by its local + * monitor the write does not affect the state of the local monitor + * - if the write is to a physical address that is covered by its local + * monitor it is IMPLEMENTATION DEFINED whether the write affects the + * state of the local monitor. + * + * A3.4.5 ARM DDI 0406C: + * + * If two STREX instructions are executed without an intervening LDREX the + * second STREX returns a status value of 1. This means that: + * + * - ARM recommends that, in a given thread of execution, every STREX has a + * preceding LDREX associated with it + * - it is not necessary for every LDREX to have a subsequent STREX. + */ + + Atomic_ReadWrite(var, val); +#else + /* + * Use inline assembler to force using a single store instruction to + * ensure that the compiler doesn't split a transfer operation into multiple + * instructions. + */ + + __asm__ __volatile__( + "mov %1, %0" + : "=m" (var->value) + : "r" (val) + ); +#endif +#elif defined(_MSC_VER) + /* + * Microsoft docs guarantee simple reads and writes to properly + * aligned 32-bit variables use only a single instruction. 
+ * http://msdn.microsoft.com/en-us/library/ms684122%28VS.85%29.aspx + */ + + var->value = val; +#else +#error No compiler defined for Atomic_Write +#endif +} +#define Atomic_Write32 Atomic_Write + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_ReadIfEqualWrite -- + * + * Compare exchange: Read variable, if equal to oldVal, write newVal + * + * Results: + * The value of the atomic variable before the write. + * + * Side effects: + * The variable may be modified. + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint32 +Atomic_ReadIfEqualWrite(Atomic_uint32 *var, // IN/OUT + uint32 oldVal, // IN + uint32 newVal) // IN +{ +#if defined(__GNUC__) +#ifdef VM_ARM_V7 + register uint32 retVal; + register uint32 res; + + dmb(); + + __asm__ __volatile__( + "1: ldrex %[retVal], [%[var]] \n\t" + "mov %[res], #0 \n\t" + "teq %[retVal], %[oldVal] \n\t" + "strexeq %[res], %[newVal], [%[var]] \n\t" + "teq %[res], #0 \n\t" + "bne 1b" + : [retVal] "=&r" (retVal), [res] "=&r" (res) + : [var] "r" (&var->value), [oldVal] "r" (oldVal), [newVal] "r" (newVal) + : "cc" + ); + + dmb(); + + return retVal; +#elif defined(VM_ARM_64) + register uint32 retVal; + register uint32 failed; + + __asm__ __volatile__ ( + " dmb sy \n\t" + "1: ldxr %w0, [%2] \n\t" + " cmp %w0, %w3 \n\t" + " b.ne 2f \n\t" + " stxr %w1, %w4, [%2] \n\t" + " cbnz %w1, 1b \n\t" + "2: clrex \n\t" + " dmb sy \n\t" + : "=&r" (retVal), "=&r" (failed) + : "r" (&var->value), "r" (oldVal), "r" (newVal) + : "cc", "memory"); + + return retVal; +#else /* VM_X86_ANY */ + uint32 val; + + /* Checked against the Intel manual and GCC --walken */ + __asm__ __volatile__( + "lock; cmpxchgl %2, %1" + : "=a" (val), + "+m" (var->value) + : "r" (newVal), + "0" (oldVal) + : "cc" + ); + AtomicEpilogue(); + return val; +#endif /* VM_X86_ANY */ +#elif defined _MSC_VER +#if _MSC_VER >= 1310 + return _InterlockedCompareExchange((long *)&var->value, + (long)newVal, + (long)oldVal); +#else +#pragma warning(push) +#pragma warning(disable : 4035) // disable no-return warning + { + __asm mov eax, oldVal + __asm mov ebx, var + __asm mov ecx, newVal + __asm lock cmpxchg [ebx]Atomic_uint32.value, ecx + // eax is the return value, this is documented to work - edward + } +#pragma warning(pop) +#endif +#else +#error No compiler defined for Atomic_ReadIfEqualWrite +#endif +} +#define Atomic_ReadIfEqualWrite32 Atomic_ReadIfEqualWrite + + +#if defined(VM_64BIT) || defined(VM_ARM_V7) +/* + *----------------------------------------------------------------------------- + * + * Atomic_ReadIfEqualWrite64 -- + * + * Compare exchange: Read variable, if equal to oldVal, write newVal + * + * Results: + * The value of the atomic variable before the write. + * + * Side effects: + * The variable may be modified. 
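+ *
+ *      Usage sketch (illustrative; 'maxSeen' and 'candidate' are hypothetical
+ *      caller-side names). The returned old value tells the caller whether
+ *      the compare-exchange took effect, which allows arbitrary
+ *      read-modify-write loops, e.g. an atomic maximum:
+ *
+ *         uint64 cur;
+ *         do {
+ *            cur = Atomic_Read64(&maxSeen);
+ *            if (candidate <= cur) {
+ *               break;                      // Nothing to update.
+ *            }
+ *         } while (Atomic_ReadIfEqualWrite64(&maxSeen, cur, candidate) != cur);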
+ * + *----------------------------------------------------------------------------- + */ + +static INLINE uint64 +Atomic_ReadIfEqualWrite64(Atomic_uint64 *var, // IN/OUT + uint64 oldVal, // IN + uint64 newVal) // IN +{ +#if defined(__GNUC__) +#ifdef VM_ARM_V7 + register uint64 retVal; + register uint32 res; + + dmb(); + + /* + * Under Apple LLVM version 5.0 (clang-500.2.76) (based on LLVM 3.3svn) + * There will be a warning: + * "value size does not match register size specified by the constraint + * and modifier [-Wasm-operand-widths]" + * on the lines: + * : [var] "r" (&var->value), [oldVal] "r" (oldVal), [newVal] "r" (newVal) + * ^ + * : [var] "r" (&var->value), [oldVal] "r" (oldVal), [newVal] "r" (newVal) + * ^ + * + * Furthermore, using a 32-bits register to store a + * 64-bits value of an variable looks risky. + */ +#if defined(__APPLE__) && __clang__ == 1 && __clang_major__ >= 5 +#pragma clang diagnostic push +#pragma clang diagnostic ignored "-Wasm-operand-widths" +#endif + __asm__ __volatile__( + "1: ldrexd %[retVal], %H[retVal], [%[var]] \n\t" + "mov %[res], #0 \n\t" + "teq %[retVal], %[oldVal] \n\t" + "teqeq %H[retVal], %H[oldVal] \n\t" + "strexdeq %[res], %[newVal], %H[newVal], [%[var]] \n\t" + "teq %[res], #0 \n\t" + "bne 1b" + : [retVal] "=&r" (retVal), [res] "=&r" (res) + : [var] "r" (&var->value), [oldVal] "r" (oldVal), [newVal] "r" (newVal) + : "cc" + ); +#if defined(__APPLE__) && __clang__ == 1 && __clang_major__ >= 5 +#pragma clang diagnostic pop +#endif // defined(__APPLE__) && __clang__ == 1 && __clang_major__ >= 5 + dmb(); + + return retVal; +#elif defined(VM_ARM_64) + register uint64 retVal; + register uint32 failed; + + __asm__ __volatile__ ( + " dmb sy \n\t" + "1: ldxr %x0, [%2] \n\t" + " cmp %x0, %x3 \n\t" + " b.ne 2f \n\t" + " stxr %w1, %x4, [%2] \n\t" + " cbnz %w1, 1b \n\t" + "2: clrex \n\t" + " dmb sy \n\t" + : "=&r" (retVal), "=&r" (failed) + : "r" (&var->value), "r" (oldVal), "r" (newVal) + : "cc", "memory"); + + return retVal; +#else /* VM_X86_64 */ + uint64 val; + + /* Checked against the AMD manual and GCC --hpreg */ + __asm__ __volatile__( + "lock; cmpxchgq %2, %1" + : "=a" (val), + "+m" (var->value) + : "r" (newVal), + "0" (oldVal) + : "cc" + ); + AtomicEpilogue(); + return val; +#endif //VM_ARM_V7 +#elif defined _MSC_VER + return _InterlockedCompareExchange64((__int64 *)&var->value, + (__int64)newVal, + (__int64)oldVal); +#else +#error No compiler defined for Atomic_ReadIfEqualWrite64 +#endif +} +#endif + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_And -- + * + * Atomic read, bitwise AND with a value, write. 
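+ *
+ *      For example (names are illustrative, not defined here), a caller can
+ *      atomically clear status bits:
+ *
+ *         Atomic_And(&flags, ~STATUS_BUSY);   // 'flags' is an Atomic_uint32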
+ * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_And(Atomic_uint32 *var, // IN/OUT + uint32 val) // IN +{ +#if defined(__GNUC__) +#ifdef VM_ARM_V7 + register volatile uint32 res; + register volatile uint32 tmp; + + dmb(); + + __asm__ __volatile__( + "1: ldrex %[tmp], [%[var]] \n\t" + "and %[tmp], %[tmp], %[val] \n\t" + "strex %[res], %[tmp], [%[var]] \n\t" + "teq %[res], #0 \n\t" + "bne 1b" + : [res] "=&r" (res), [tmp] "=&r" (tmp) + : [var] "r" (&var->value), [val] "r" (val) + : "cc" + ); + + dmb(); +#elif defined(VM_ARM_64) + ARM_64_ATOMIC_32_OPV_PRIVATE_FENCED(var, val, and); +#else /* VM_X86_ANY */ + /* Checked against the Intel manual and GCC --walken */ + __asm__ __volatile__( + "lock; andl %1, %0" + : "+m" (var->value) + : "ri" (val) + : "cc" + ); + AtomicEpilogue(); +#endif /* VM_X86_ANY */ +#elif defined _MSC_VER +#if defined(__x86_64__) + _InterlockedAnd((long *)&var->value, (long)val); +#else + __asm mov eax, val + __asm mov ebx, var + __asm lock and [ebx]Atomic_uint32.value, eax +#endif +#else +#error No compiler defined for Atomic_And +#endif +} +#define Atomic_And32 Atomic_And + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Or -- + * + * Atomic read, bitwise OR with a value, write. + * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Or(Atomic_uint32 *var, // IN/OUT + uint32 val) // IN +{ +#if defined(__GNUC__) +#ifdef VM_ARM_V7 + register volatile uint32 res; + register volatile uint32 tmp; + + dmb(); + + __asm__ __volatile__( + "1: ldrex %[tmp], [%[var]] \n\t" + "orr %[tmp], %[tmp], %[val] \n\t" + "strex %[res], %[tmp], [%[var]] \n\t" + "teq %[res], #0 \n\t" + "bne 1b" + : [res] "=&r" (res), [tmp] "=&r" (tmp) + : [var] "r" (&var->value), [val] "r" (val) + : "cc" + ); + + dmb(); +#elif defined(VM_ARM_64) + ARM_64_ATOMIC_32_OPV_PRIVATE_FENCED(var, val, orr); +#else /* VM_X86_ANY */ + /* Checked against the Intel manual and GCC --walken */ + __asm__ __volatile__( + "lock; orl %1, %0" + : "+m" (var->value) + : "ri" (val) + : "cc" + ); + AtomicEpilogue(); +#endif /* VM_X86_ANY */ +#elif defined _MSC_VER +#if defined(__x86_64__) + _InterlockedOr((long *)&var->value, (long)val); +#else + __asm mov eax, val + __asm mov ebx, var + __asm lock or [ebx]Atomic_uint32.value, eax +#endif +#else +#error No compiler defined for Atomic_Or +#endif +} +#define Atomic_Or32 Atomic_Or + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Xor -- + * + * Atomic read, bitwise XOR with a value, write. 
+ * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Xor(Atomic_uint32 *var, // IN/OUT + uint32 val) // IN +{ +#if defined(__GNUC__) +#ifdef VM_ARM_V7 + register volatile uint32 res; + register volatile uint32 tmp; + + dmb(); + + __asm__ __volatile__( + "1: ldrex %[tmp], [%[var]] \n\t" + "eor %[tmp], %[tmp], %[val] \n\t" + "strex %[res], %[tmp], [%[var]] \n\t" + "teq %[res], #0 \n\t" + "bne 1b" + : [res] "=&r" (res), [tmp] "=&r" (tmp) + : [var] "r" (&var->value), [val] "r" (val) + : "cc" + ); + + dmb(); +#elif defined(VM_ARM_64) + ARM_64_ATOMIC_32_OPV_PRIVATE_FENCED(var, val, eor); +#else /* VM_X86_ANY */ + /* Checked against the Intel manual and GCC --walken */ + __asm__ __volatile__( + "lock; xorl %1, %0" + : "+m" (var->value) + : "ri" (val) + : "cc" + ); + AtomicEpilogue(); +#endif /* VM_X86_ANY */ +#elif defined _MSC_VER +#if defined(__x86_64__) + _InterlockedXor((long *)&var->value, (long)val); +#else + __asm mov eax, val + __asm mov ebx, var + __asm lock xor [ebx]Atomic_uint32.value, eax +#endif +#else +#error No compiler defined for Atomic_Xor +#endif +} +#define Atomic_Xor32 Atomic_Xor + + +#if defined(VM_64BIT) +/* + *----------------------------------------------------------------------------- + * + * Atomic_Xor64 -- + * + * Atomic read, bitwise XOR with a value, write. + * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Xor64(Atomic_uint64 *var, // IN/OUT + uint64 val) // IN +{ +#if defined(__GNUC__) +#if defined(VM_ARM_64) + ARM_64_ATOMIC_64_OPV_PRIVATE_FENCED(var, val, eor); +#else /* VM_X86_64 */ + /* Checked against the AMD manual and GCC --hpreg */ + __asm__ __volatile__( + "lock; xorq %1, %0" + : "+m" (var->value) + : "re" (val) + : "cc" + ); + AtomicEpilogue(); +#endif +#elif defined _MSC_VER + _InterlockedXor64((__int64 *)&var->value, (__int64)val); +#else +#error No compiler defined for Atomic_Xor64 +#endif +} +#endif + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Add -- + * + * Atomic read, add a value, write. 
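+ *
+ *      For example (illustrative names only), accumulating a byte count
+ *      written from several threads:
+ *
+ *         Atomic_Add(&bytesQueued, pktLen);   // 'bytesQueued' is Atomic_uint32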
+ * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Add(Atomic_uint32 *var, // IN/OUT + uint32 val) // IN +{ +#if defined(__GNUC__) +#ifdef VM_ARM_V7 + register volatile uint32 res; + register volatile uint32 tmp; + + dmb(); + + __asm__ __volatile__( + "1: ldrex %[tmp], [%[var]] \n\t" + "add %[tmp], %[tmp], %[val] \n\t" + "strex %[res], %[tmp], [%[var]] \n\t" + "teq %[res], #0 \n\t" + "bne 1b" + : [res] "=&r" (res), [tmp] "=&r" (tmp) + : [var] "r" (&var->value), [val] "r" (val) + : "cc" + ); + + dmb(); +#elif defined(VM_ARM_64) + ARM_64_ATOMIC_32_OPV_PRIVATE_FENCED(var, val, add); +#else /* VM_X86_ANY */ + /* Checked against the Intel manual and GCC --walken */ + __asm__ __volatile__( + "lock; addl %1, %0" + : "+m" (var->value) + : "ri" (val) + : "cc" + ); + AtomicEpilogue(); +#endif /* VM_X86_ANY */ +#elif defined _MSC_VER +#if _MSC_VER >= 1310 + _InterlockedExchangeAdd((long *)&var->value, (long)val); +#else + __asm mov eax, val + __asm mov ebx, var + __asm lock add [ebx]Atomic_uint32.value, eax +#endif +#else +#error No compiler defined for Atomic_Add +#endif +} +#define Atomic_Add32 Atomic_Add + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Sub -- + * + * Atomic read, subtract a value, write. + * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Sub(Atomic_uint32 *var, // IN/OUT + uint32 val) // IN +{ +#if defined(__GNUC__) +#ifdef VM_ARM_V7 + register volatile uint32 res; + register volatile uint32 tmp; + + dmb(); + + __asm__ __volatile__( + "1: ldrex %[tmp], [%[var]] \n\t" + "sub %[tmp], %[tmp], %[val] \n\t" + "strex %[res], %[tmp], [%[var]] \n\t" + "teq %[res], #0 \n\t" + "bne 1b" + : [res] "=&r" (res), [tmp] "=&r" (tmp) + : [var] "r" (&var->value), [val] "r" (val) + : "cc" + ); + + dmb(); +#elif defined(VM_ARM_64) + ARM_64_ATOMIC_32_OPV_PRIVATE_FENCED(var, val, sub); +#else /* VM_X86_ANY */ + /* Checked against the Intel manual and GCC --walken */ + __asm__ __volatile__( + "lock; subl %1, %0" + : "+m" (var->value) + : "ri" (val) + : "cc" + ); + AtomicEpilogue(); +#endif /* VM_X86_ANY */ +#elif defined _MSC_VER +#if _MSC_VER >= 1310 + _InterlockedExchangeAdd((long *)&var->value, (long)-val); +#else + __asm mov eax, val + __asm mov ebx, var + __asm lock sub [ebx]Atomic_uint32.value, eax +#endif +#else +#error No compiler defined for Atomic_Sub +#endif +} +#define Atomic_Sub32 Atomic_Sub + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Inc -- + * + * Atomic read, increment, write. 
+ * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Inc(Atomic_uint32 *var) // IN/OUT +{ +#ifdef __GNUC__ +#if defined(VM_ARM_ANY) + Atomic_Add(var, 1); +#else /* VM_X86_ANY */ + /* Checked against the Intel manual and GCC --walken */ + __asm__ __volatile__( + "lock; incl %0" + : "+m" (var->value) + : + : "cc" + ); + AtomicEpilogue(); +#endif /* VM_X86_ANY */ +#elif defined _MSC_VER +#if _MSC_VER >= 1310 + _InterlockedIncrement((long *)&var->value); +#else + __asm mov ebx, var + __asm lock inc [ebx]Atomic_uint32.value +#endif +#else +#error No compiler defined for Atomic_Inc +#endif +} +#define Atomic_Inc32 Atomic_Inc + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Dec -- + * + * Atomic read, decrement, write. + * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Dec(Atomic_uint32 *var) // IN/OUT +{ +#ifdef __GNUC__ +#if defined(VM_ARM_ANY) + Atomic_Sub(var, 1); +#else /* VM_X86_ANY */ + /* Checked against the Intel manual and GCC --walken */ + __asm__ __volatile__( + "lock; decl %0" + : "+m" (var->value) + : + : "cc" + ); + AtomicEpilogue(); +#endif /* VM_X86_ANY */ +#elif defined _MSC_VER +#if _MSC_VER >= 1310 + _InterlockedDecrement((long *)&var->value); +#else + __asm mov ebx, var + __asm lock dec [ebx]Atomic_uint32.value +#endif +#else +#error No compiler defined for Atomic_Dec +#endif +} +#define Atomic_Dec32 Atomic_Dec + + +/* + * Note that the technique below can be used to implement ReadX(), where X is + * an arbitrary mathematical function. + */ + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_ReadOr32 -- + * + * Atomic read (returned), bitwise OR with a value, write. + * + * Results: + * The value of the variable before the operation. + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint32 +Atomic_ReadOr32(Atomic_uint32 *var, // IN/OUT + uint32 val) // IN +{ + uint32 res; + + do { + res = Atomic_Read(var); + } while (res != Atomic_ReadIfEqualWrite(var, res, res | val)); + + return res; +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_ReadAnd32 -- + * + * Atomic read (returned), bitwise And with a value, write. + * + * Results: + * The value of the variable before the operation. + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint32 +Atomic_ReadAnd32(Atomic_uint32 *var, // IN/OUT + uint32 val) // IN +{ + uint32 res; + + do { + res = Atomic_Read(var); + } while (res != Atomic_ReadIfEqualWrite(var, res, res & val)); + + return res; +} + + +#if defined(VM_64BIT) +/* + *----------------------------------------------------------------------------- + * + * Atomic_ReadOr64 -- + * + * Atomic read (returned), bitwise OR with a value, write. + * + * Results: + * The value of the variable before the operation. 
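+ *
+ *      Usage sketch (illustrative; 'eventMask' and EVENT_PENDING are
+ *      hypothetical caller-side names). Since the pre-OR value is returned,
+ *      the caller can tell whether it was the one that set a bit:
+ *
+ *         if ((Atomic_ReadOr64(&eventMask, EVENT_PENDING) & EVENT_PENDING) == 0) {
+ *            // The bit was clear before this call; schedule the handler once.
+ *         }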
+ * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint64 +Atomic_ReadOr64(Atomic_uint64 *var, // IN/OUT + uint64 val) // IN +{ + uint64 res; + + do { + res = var->value; + } while (res != Atomic_ReadIfEqualWrite64(var, res, res | val)); + + return res; +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_ReadAnd64 -- + * + * Atomic read (returned), bitwise AND with a value, write. + * + * Results: + * The value of the variable before the operation. + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint64 +Atomic_ReadAnd64(Atomic_uint64 *var, // IN/OUT + uint64 val) // IN +{ + uint64 res; + + do { + res = var->value; + } while (res != Atomic_ReadIfEqualWrite64(var, res, res & val)); + + return res; +} +#endif /* defined(VM_64BIT) */ + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_ReadAdd32 -- + * + * Atomic read (returned), add a value, write. + * + * If you have to implement ReadAdd32() on an architecture other than + * x86 or x86-64, you might want to consider doing something similar to + * Atomic_ReadOr32(). + * + * Results: + * The value of the variable before the operation. + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint32 +Atomic_ReadAdd32(Atomic_uint32 *var, // IN/OUT + uint32 val) // IN +{ +#if defined(__GNUC__) +#ifdef VM_ARM_V7 + register volatile uint32 res; + register volatile uint32 retVal; + register volatile uint32 tmp; + + dmb(); + + __asm__ __volatile__( + "1: ldrex %[retVal], [%[var]] \n\t" + "add %[tmp], %[val], %[retVal] \n\t" + "strex %[res], %[tmp], [%[var]] \n\t" + "teq %[res], #0 \n\t" + "bne 1b" + : [tmp] "=&r" (tmp), [res] "=&r" (res), [retVal] "=&r" (retVal) + : [var] "r" (&var->value), [val] "r" (val) + : "cc" + ); + + dmb(); + + return retVal; +#elif defined(VM_ARM_64) + return ARM_64_ATOMIC_32_OPO_PRIVATE_FENCED(var, val, add); +#else /* VM_X86_ANY */ + /* Checked against the Intel manual and GCC --walken */ + __asm__ __volatile__( + "lock; xaddl %0, %1" + : "=r" (val), + "+m" (var->value) + : "0" (val) + : "cc" + ); + AtomicEpilogue(); + return val; +#endif /* VM_X86_ANY */ +#elif defined _MSC_VER +#if _MSC_VER >= 1310 + return _InterlockedExchangeAdd((long *)&var->value, (long)val); +#else +#pragma warning(push) +#pragma warning(disable : 4035) // disable no-return warning + { + __asm mov eax, val + __asm mov ebx, var + __asm lock xadd [ebx]Atomic_uint32.value, eax + } +#pragma warning(pop) +#endif +#else +#error No compiler defined for Atomic_ReadAdd32 +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_ReadInc32 -- + * + * Atomic read (returned), increment, write. + * + * Results: + * The value of the variable before the operation. + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint32 +Atomic_ReadInc32(Atomic_uint32 *var) // IN/OUT +{ + return Atomic_ReadAdd32(var, 1); +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_ReadDec32 -- + * + * Atomic read (returned), decrement, write. + * + * Results: + * The value of the variable before the operation. 
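+ *
+ *      Usage sketch (illustrative; 'obj', 'refCount' and ObjDestroy() are
+ *      hypothetical). Returning the pre-decrement value gives the usual
+ *      reference-release idiom:
+ *
+ *         if (Atomic_ReadDec32(&obj->refCount) == 1) {
+ *            ObjDestroy(obj);   // Count just dropped from 1 to 0.
+ *         }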
+ * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint32 +Atomic_ReadDec32(Atomic_uint32 *var) // IN/OUT +{ + return Atomic_ReadAdd32(var, (uint32)-1); +} + + +#if defined VMKERNEL || defined VMM +#if !defined(VM_ARM_64) +/* + *----------------------------------------------------------------------------- + * + * CMPXCHG1B -- + * + * Compare and exchange a single byte. + * + * Results: + * The value read from ptr. + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ +static INLINE uint8 +CMPXCHG1B(volatile uint8 *ptr, // IN/OUT + uint8 oldVal, // IN + uint8 newVal) // IN +{ + uint8 val; + __asm__ __volatile__("lock; cmpxchgb %b2, %1" + : "=a" (val), + "+m" (*ptr) + : "r" (newVal), + "0" (oldVal) + : "cc"); + return val; +} +#endif /* !defined(VM_ARM_64) */ +#endif + + +/* + * Usage of this helper struct is strictly reserved to the following + * function. --hpreg + */ +typedef struct { + uint32 lowValue; + uint32 highValue; +} S_uint64; + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_CMPXCHG64 -- + * + * Compare exchange: Read variable, if equal to oldVal, write newVal + * + * XXX: Ensure that if this function is to be inlined by gcc, it is + * compiled with -fno-strict-aliasing. Otherwise it will break. + * Unfortunately we know that gcc 2.95.3 (used to build the FreeBSD 3.2 + * Tools) does not honor -fno-strict-aliasing. As a workaround, we avoid + * inlining the function entirely for versions of gcc under 3.0. + * + * Results: + * TRUE if equal, FALSE if not equal + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +#if defined(__GNUC__) && __GNUC__ < 3 +static Bool +#else +static INLINE Bool +#endif +Atomic_CMPXCHG64(Atomic_uint64 *var, // IN/OUT + uint64 const *oldVal, // IN + uint64 const *newVal) // IN +{ +#if defined(__GNUC__) +#if defined(VM_ARM_ANY) + return (Atomic_ReadIfEqualWrite64(var, *oldVal, *newVal) == *oldVal); +#else /* VM_X86_ANY */ + + Bool equal; + /* Checked against the Intel manual and GCC --walken */ +#if defined(__x86_64__) + uint64 dummy; + __asm__ __volatile__( + "lock; cmpxchgq %3, %0" "\n\t" + "sete %1" + : "+m" (*var), + "=qm" (equal), + "=a" (dummy) + : "r" (*newVal), + "2" (*oldVal) + : "cc" + ); +#else /* 32-bit version for non-ARM */ + int dummy1, dummy2; +# if defined __PIC__ + /* + * Rules for __asm__ statements in __PIC__ code + * -------------------------------------------- + * + * The compiler uses %ebx for __PIC__ code, so an __asm__ statement cannot + * clobber %ebx. The __asm__ statement can temporarily modify %ebx, but _for + * each parameter that is used while %ebx is temporarily modified_: + * + * 1) The constraint cannot be "m", because the memory location the compiler + * chooses could then be relative to %ebx. + * + * 2) The constraint cannot be a register class which contains %ebx (such as + * "r" or "q"), because the register the compiler chooses could then be + * %ebx. (This happens when compiling the Fusion UI with gcc 4.2.1, Apple + * build 5577.) + * + * 3) Using register classes even for other values is problematic, as gcc + * can decide e.g. %ecx == %edi == 0 (as compile-time constants) and + * ends up using one register for two things. Which breaks xchg's ability + * to temporarily put the PIC pointer somewhere else. 
PR772455 + * + * For that reason alone, the __asm__ statement should keep the regions + * where it temporarily modifies %ebx as small as possible, and should + * prefer specific register assignments. + */ +# if __GNUC__ < 3 // Part of #188541 - for RHL 6.2 etc. + __asm__ __volatile__( + "xchg %%ebx, %6" "\n\t" + "mov 4(%%ebx), %%ecx" "\n\t" + "mov (%%ebx), %%ebx" "\n\t" + "lock; cmpxchg8b (%3)" "\n\t" + "xchg %%ebx, %6" "\n\t" + "sete %0" + : "=a" (equal), + "=d" (dummy2), + "=D" (dummy1) + : /* + * See the "Rules for __asm__ statements in __PIC__ code" above: %3 + * must use a register class which does not contain %ebx. + */ + "S" (var), + "0" (((S_uint64 const *)oldVal)->lowValue), + "1" (((S_uint64 const *)oldVal)->highValue), + "D" (newVal) + : "ecx", "cc", "memory" + ); +# else + __asm__ __volatile__( + "xchgl %%ebx, %6" "\n\t" + "lock; cmpxchg8b (%3)" "\n\t" + "xchgl %%ebx, %6" "\n\t" + "sete %0" + : "=qm" (equal), + "=a" (dummy1), + "=d" (dummy2) + : /* + * See the "Rules for __asm__ statements in __PIC__ code" above: %3 + * must use a register class which does not contain %ebx. + * "a"/"c"/"d" are already used, so we are left with either "S" or "D". + * + * Note that this assembly uses ALL GP registers (with %esp reserved for + * stack, %ebp reserved for frame, %ebx reserved for PIC). + */ + "S" (var), + "1" (((S_uint64 const *)oldVal)->lowValue), + "2" (((S_uint64 const *)oldVal)->highValue), + "D" (((S_uint64 const *)newVal)->lowValue), + "c" (((S_uint64 const *)newVal)->highValue) + : "cc", "memory" + ); +# endif +# else + __asm__ __volatile__( + "lock; cmpxchg8b %0" "\n\t" + "sete %1" + : "+m" (*var), + "=qm" (equal), + "=a" (dummy1), + "=d" (dummy2) + : "2" (((S_uint64 const *)oldVal)->lowValue), + "3" (((S_uint64 const *)oldVal)->highValue), + "b" (((S_uint64 const *)newVal)->lowValue), + "c" (((S_uint64 const *)newVal)->highValue) + : "cc" + ); +# endif +#endif + AtomicEpilogue(); + return equal; +#endif //VM_ARM_V7 +#elif defined _MSC_VER +#if defined(__x86_64__) + return (__int64)*oldVal == _InterlockedCompareExchange64((__int64 *)&var->value, + (__int64)*newVal, + (__int64)*oldVal); +#else +#pragma warning(push) +#pragma warning(disable : 4035) // disable no-return warning + { + __asm mov esi, var + __asm mov edx, oldVal + __asm mov ecx, newVal + __asm mov eax, [edx]S_uint64.lowValue + __asm mov edx, [edx]S_uint64.highValue + __asm mov ebx, [ecx]S_uint64.lowValue + __asm mov ecx, [ecx]S_uint64.highValue + __asm lock cmpxchg8b [esi] + __asm sete al + __asm movzx eax, al + // eax is the return value, this is documented to work - edward + } +#pragma warning(pop) +#endif +#else +#error No compiler defined for Atomic_CMPXCHG64 +#endif // !GNUC +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_CMPXCHG32 -- + * + * Compare exchange: Read variable, if equal to oldVal, write newVal + * + * Results: + * TRUE if equal, FALSE if not equal + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE Bool +Atomic_CMPXCHG32(Atomic_uint32 *var, // IN/OUT + uint32 oldVal, // IN + uint32 newVal) // IN +{ +#if defined(__GNUC__) +#if defined(VM_ARM_ANY) + return (Atomic_ReadIfEqualWrite(var, oldVal, newVal) == oldVal); +#else /* VM_X86_ANY */ + Bool equal; + uint32 dummy; + + __asm__ __volatile__( + "lock; cmpxchgl %3, %0" "\n\t" + "sete %1" + : "+m" (*var), + "=qm" (equal), + "=a" (dummy) + : "r" (newVal), + "2" (oldVal) + : "cc" + ); + AtomicEpilogue(); + 
return equal; +#endif /* VM_X86_ANY */ +#else // defined(__GNUC__) + return (Atomic_ReadIfEqualWrite(var, oldVal, newVal) == oldVal); +#endif // !defined(__GNUC__) +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Read64 -- + * + * Read and return. + * + * Results: + * The value of the atomic variable. + * + * Side effects: + * None. + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint64 +Atomic_Read64(Atomic_uint64 const *var) // IN +{ +#if defined(__GNUC__) && defined(__x86_64__) + uint64 value; + +#ifdef VMM + ASSERT((uintptr_t)var % 8 == 0); +#endif + /* + * Use asm to ensure we emit a single load. + */ + __asm__ __volatile__( + "movq %1, %0" + : "=r" (value) + : "m" (var->value) + ); + return value; +#elif defined(__GNUC__) && defined(__i386__) + uint64 value; + /* + * Since cmpxchg8b will replace the contents of EDX:EAX with the + * value in memory if there is no match, we need only execute the + * instruction once in order to atomically read 64 bits from + * memory. The only constraint is that ECX:EBX must have the same + * value as EDX:EAX so that if the comparison succeeds. We + * intentionally don't tell gcc that we are using ebx and ecx as we + * don't modify them and do not care what value they store. + */ + __asm__ __volatile__( + "mov %%ebx, %%eax" "\n\t" + "mov %%ecx, %%edx" "\n\t" + "lock; cmpxchg8b %1" + : "=&A" (value) + : "m" (*var) + : "cc" + ); + AtomicEpilogue(); + return value; +#elif defined (_MSC_VER) && defined(__x86_64__) + /* + * Microsoft docs guarantee "Simple reads and writes to properly + * aligned 64-bit variables are atomic on 64-bit Windows." + * http://msdn.microsoft.com/en-us/library/ms684122%28VS.85%29.aspx + * + * XXX Verify that value is properly aligned. Bug 61315. + */ + return var->value; +#elif defined (_MSC_VER) && defined(__i386__) +# pragma warning(push) +# pragma warning(disable : 4035) // disable no-return warning + { + __asm mov ecx, var + __asm mov edx, ecx + __asm mov eax, ebx + __asm lock cmpxchg8b [ecx] + // edx:eax is the return value; this is documented to work. --mann + } +# pragma warning(pop) +#elif defined(__GNUC__) && defined (VM_ARM_V7) + uint64 value; + + __asm__ __volatile__( + "ldrexd %[value], %H[value], [%[var]] \n\t" + : [value] "=&r" (value) + : [var] "r" (&var->value) + ); + + return value; +#elif defined(__GNUC__) && defined(VM_ARM_64) + uint64 value; + + __asm__ __volatile__( + "ldr %0, [%1]" + : "=r" (value) + : "r" (&var->value)); + + return value; +#endif /* defined(__GNUC__) && defined(VM_ARM_64) */ +} + + +/* + *---------------------------------------------------------------------- + * + * Atomic_ReadUnaligned64 -- + * + * Atomically read a 64 bit integer, possibly misaligned. + * This function can be *very* expensive, costing over 50 kcycles + * on Nehalem. + * + * Note that "var" needs to be writable, even though it will not + * be modified. + * + * Results: + * The value of the atomic variable. 
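+ *
+ *      Usage sketch (illustrative; 'hdr' and its 'seq' field are hypothetical
+ *      and possibly misaligned, e.g. inside a packed structure):
+ *
+ *         uint64 seq = Atomic_ReadUnaligned64((Atomic_uint64 const *)&hdr->seq);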
+ * + * Side effects: + * None + * + *---------------------------------------------------------------------- + */ + +#if defined(VM_64BIT) +static INLINE uint64 +Atomic_ReadUnaligned64(Atomic_uint64 const *var) // IN: +{ + return Atomic_ReadIfEqualWrite64((Atomic_uint64*)var, 0, 0); +} +#endif + + +/* + *---------------------------------------------------------------------- + * + * Atomic_ReadAdd64 -- + * + * Atomically adds a 64-bit integer to another + * + * Results: + * Returns the old value just prior to the addition + * + * Side effects: + * None + * + *---------------------------------------------------------------------- + */ + +static INLINE uint64 +Atomic_ReadAdd64(Atomic_uint64 *var, // IN/OUT + uint64 val) // IN +{ +#if defined(VM_ARM_64) + return ARM_64_ATOMIC_64_OPO_PRIVATE_FENCED(var, val, add); +#elif defined(__x86_64__) + +#if defined(__GNUC__) + __asm__ __volatile__( + "lock; xaddq %0, %1" + : "=r" (val), + "+m" (var->value) + : "0" (val) + : "cc" + ); + AtomicEpilogue(); + return val; +#elif defined _MSC_VER + return _InterlockedExchangeAdd64((__int64 *)&var->value, (__int64)val); +#else +#error No compiler defined for Atomic_ReadAdd64 +#endif + +#else + uint64 oldVal; + uint64 newVal; + + do { + oldVal = var->value; + newVal = oldVal + val; + } while (!Atomic_CMPXCHG64(var, &oldVal, &newVal)); + + return oldVal; +#endif +} + + +/* + *---------------------------------------------------------------------- + * + * Atomic_ReadSub64 -- + * + * Atomically subtracts a 64-bit integer to another + * + * Results: + * Returns the old value just prior to the subtraction + * + * Side effects: + * None + * + *---------------------------------------------------------------------- + */ + +static INLINE uint64 +Atomic_ReadSub64(Atomic_uint64 *var, // IN/OUT + uint64 val) // IN +{ + return Atomic_ReadAdd64(var, -val); +} + + +/* + *---------------------------------------------------------------------- + * + * Atomic_ReadInc64 -- + * + * Atomically increments a 64-bit integer + * + * Results: + * Returns the old value just prior to incrementing + * + * Side effects: + * None + * + *---------------------------------------------------------------------- + */ + +static INLINE uint64 +Atomic_ReadInc64(Atomic_uint64 *var) // IN/OUT +{ + return Atomic_ReadAdd64(var, 1); +} + + +/* + *---------------------------------------------------------------------- + * + * Atomic_ReadDec64 -- + * + * Atomically decrements a 64-bit integer + * + * Results: + * Returns the old value just prior to decrementing + * + * Side effects: + * None + * + *---------------------------------------------------------------------- + */ + +static INLINE uint64 +Atomic_ReadDec64(Atomic_uint64 *var) // IN/OUT +{ + return Atomic_ReadAdd64(var, CONST64U(-1)); +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Add64 -- + * + * Atomic read, add a value, write. + * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Add64(Atomic_uint64 *var, // IN/OUT + uint64 val) // IN +{ +#if !defined(VM_64BIT) + Atomic_ReadAdd64(var, val); /* Return value is unused. 
*/ +#elif defined(__GNUC__) +#if defined(VM_ARM_64) + ARM_64_ATOMIC_64_OPV_PRIVATE_FENCED(var, val, add); +#else /* defined(VM_X86_64) */ + /* Checked against the AMD manual and GCC --hpreg */ + __asm__ __volatile__( + "lock; addq %1, %0" + : "+m" (var->value) + : "re" (val) + : "cc" + ); + AtomicEpilogue(); +#endif +#elif defined _MSC_VER + _InterlockedExchangeAdd64((__int64 *)&var->value, (__int64)val); +#else +#error No compiler defined for Atomic_Add64 +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Sub64 -- + * + * Atomic read, subtract a value, write. + * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Sub64(Atomic_uint64 *var, // IN/OUT + uint64 val) // IN +{ +#if !defined(__x86_64__) + Atomic_ReadSub64(var, val); /* Return value is unused. */ +#elif defined(__GNUC__) +#if defined(VM_ARM_64) + ARM_64_ATOMIC_64_OPV_PRIVATE_FENCED(var, val, sub); +#else /* VM_X86_64 */ + /* Checked against the AMD manual and GCC --hpreg */ + __asm__ __volatile__( + "lock; subq %1, %0" + : "+m" (var->value) + : "re" (val) + : "cc" + ); + AtomicEpilogue(); +#endif +#elif defined _MSC_VER + _InterlockedExchangeAdd64((__int64 *)&var->value, (__int64)-val); +#else +#error No compiler defined for Atomic_Sub64 +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Inc64 -- + * + * Atomic read, increment, write. + * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Inc64(Atomic_uint64 *var) // IN/OUT +{ +#if !defined(__x86_64__) + Atomic_ReadInc64(var); /* Return value is unused. */ +#elif defined(__GNUC__) + /* Checked against the AMD manual and GCC --hpreg */ + __asm__ __volatile__( + "lock; incq %0" + : "+m" (var->value) + : + : "cc" + ); + AtomicEpilogue(); +#elif defined _MSC_VER + _InterlockedIncrement64((__int64 *)&var->value); +#else +#error No compiler defined for Atomic_Inc64 +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Dec64 -- + * + * Atomic read, decrement, write. + * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Dec64(Atomic_uint64 *var) // IN/OUT +{ +#if !defined(__x86_64__) + Atomic_ReadDec64(var); /* Return value is unused. */ +#elif defined(__GNUC__) + /* Checked against the AMD manual and GCC --hpreg */ + __asm__ __volatile__( + "lock; decq %0" + : "+m" (var->value) + : + : "cc" + ); + AtomicEpilogue(); +#elif defined _MSC_VER + _InterlockedDecrement64((__int64 *)&var->value); +#else +#error No compiler defined for Atomic_Dec64 +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_ReadWrite64 -- + * + * Read followed by write + * + * Results: + * The value of the atomic variable before the write. 
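+ *
+ *      Usage sketch (illustrative; 'pendingBytes' is a hypothetical
+ *      Atomic_uint64 owned by the caller). The exchange drains a counter
+ *      and returns what had accumulated:
+ *
+ *         uint64 drained = Atomic_ReadWrite64(&pendingBytes, 0);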
+ * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint64 +Atomic_ReadWrite64(Atomic_uint64 *var, // IN/OUT + uint64 val) // IN +{ +#if defined(__x86_64__) +#if defined(__GNUC__) + /* Checked against the AMD manual and GCC --hpreg */ + __asm__ __volatile__( + "xchgq %0, %1" + : "=r" (val), + "+m" (var->value) + : "0" (val) + ); + AtomicEpilogue(); + return val; +#elif defined _MSC_VER + return _InterlockedExchange64((__int64 *)&var->value, (__int64)val); +#else +#error No compiler defined for Atomic_ReadWrite64 +#endif +#else + uint64 oldVal; + + do { + oldVal = var->value; + } while (!Atomic_CMPXCHG64(var, &oldVal, &val)); + + return oldVal; +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Write64 -- + * + * Write + * + * Results: + * None. + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Write64(Atomic_uint64 *var, // OUT + uint64 val) // IN +{ +#if defined(__x86_64__) +#if defined(__GNUC__) + +#ifdef VMM + ASSERT((uintptr_t)var % 8 == 0); +#endif + /* + * There is no move instruction for 64-bit immediate to memory, so unless + * the immediate value fits in 32-bit (i.e. can be sign-extended), GCC + * breaks the assignment into two movl instructions. The code below forces + * GCC to load the immediate value into a register first. + */ + + __asm__ __volatile__( + "movq %1, %0" + : "=m" (var->value) + : "r" (val) + ); +#elif defined _MSC_VER + /* + * Microsoft docs guarantee "Simple reads and writes to properly aligned + * 64-bit variables are atomic on 64-bit Windows." + * http://msdn.microsoft.com/en-us/library/ms684122%28VS.85%29.aspx + * + * XXX Verify that value is properly aligned. Bug 61315. + */ + + var->value = val; +#else +#error No compiler defined for Atomic_Write64 +#endif +#else /* defined(__x86_64__) */ + (void)Atomic_ReadWrite64(var, val); +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Or64 -- + * + * Atomic read, bitwise OR with a 64-bit value, write. + * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Or64(Atomic_uint64 *var, // IN/OUT + uint64 val) // IN +{ +#if defined(__x86_64__) +#if defined(__GNUC__) + /* Checked against the AMD manual and GCC --hpreg */ + __asm__ __volatile__( + "lock; orq %1, %0" + : "+m" (var->value) + : "re" (val) + : "cc" + ); + AtomicEpilogue(); +#elif defined _MSC_VER + _InterlockedOr64((__int64 *)&var->value, (__int64)val); +#else +#error No compiler defined for Atomic_Or64 +#endif +#else // __x86_64__ + uint64 oldVal; + uint64 newVal; + do { + oldVal = var->value; + newVal = oldVal | val; + } while (!Atomic_CMPXCHG64(var, &oldVal, &newVal)); +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_And64 -- + * + * Atomic read, bitwise AND with a 64-bit value, write. 
+ * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_And64(Atomic_uint64 *var, // IN/OUT + uint64 val) // IN +{ +#if defined(__x86_64__) +#if defined(__GNUC__) + /* Checked against the AMD manual and GCC --hpreg */ + __asm__ __volatile__( + "lock; andq %1, %0" + : "+m" (var->value) + : "re" (val) + : "cc" + ); + AtomicEpilogue(); +#elif defined _MSC_VER + _InterlockedAnd64((__int64 *)&var->value, (__int64)val); +#else +#error No compiler defined for Atomic_And64 +#endif +#else // __x86_64__ + uint64 oldVal; + uint64 newVal; + do { + oldVal = var->value; + newVal = oldVal & val; + } while (!Atomic_CMPXCHG64(var, &oldVal, &newVal)); +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_SetBit64 -- + * + * Atomically set the bit 'bit' in var. Bit must be between 0 and 63. + * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_SetBit64(Atomic_uint64 *var, // IN/OUT + uint64 bit) // IN +{ +#if defined(__x86_64__) +#if defined(__GNUC__) + ASSERT(bit <= 63); + __asm__ __volatile__( + "lock; bts %1, %0" + : "+m" (var->value) + : "ri" (bit) + : "cc" + ); + AtomicEpilogue(); +#elif defined _MSC_VER + uint64 oldVal; + uint64 newVal; + ASSERT(bit <= 63); + do { + oldVal = var->value; + newVal = oldVal | (CONST64U(1) << bit); + } while (!Atomic_CMPXCHG64(var, &oldVal, &newVal)); +#else +#error No compiler defined for Atomic_SetBit64 +#endif +#else // __x86_64__ + uint64 oldVal; + uint64 newVal; + ASSERT(bit <= 63); + do { + oldVal = var->value; + newVal = oldVal | (CONST64U(1) << bit); + } while (!Atomic_CMPXCHG64(var, &oldVal, &newVal)); +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_ClearBit64 -- + * + * Atomically clear the bit 'bit' in var. Bit must be between 0 and 63. + * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_ClearBit64(Atomic_uint64 *var, // IN/OUT + uint64 bit) // IN +{ +#if defined(__x86_64__) +#if defined(__GNUC__) + ASSERT(bit <= 63); + __asm__ __volatile__( + "lock; btr %1, %0" + : "+m" (var->value) + : "ri" (bit) + : "cc" + ); + AtomicEpilogue(); +#elif defined _MSC_VER + uint64 oldVal; + uint64 newVal; + ASSERT(bit <= 63); + do { + oldVal = var->value; + newVal = oldVal & ~(CONST64U(1) << bit); + } while (!Atomic_CMPXCHG64(var, &oldVal, &newVal)); +#else +#error No compiler defined for Atomic_ClearBit64 +#endif +#else // __x86_64__ + uint64 oldVal; + uint64 newVal; + ASSERT(bit <= 63); + do { + oldVal = var->value; + newVal = oldVal & ~(CONST64U(1) << bit); + } while (!Atomic_CMPXCHG64(var, &oldVal, &newVal)); +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_TestBit64 -- + * + * Read the bit 'bit' in var. Bit must be between 0 and 63. + * + * Results: + * TRUE if the tested bit was set; else FALSE. 
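+ *
+ *      Usage sketch (illustrative; 'cpuMask' is a hypothetical Atomic_uint64
+ *      used as a 64-entry bitmap):
+ *
+ *         Atomic_SetBit64(&cpuMask, 5);
+ *         if (Atomic_TestBit64(&cpuMask, 5)) {
+ *            // Bit 5 was set at the time of the read; it may change later.
+ *         }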
+ * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE Bool +Atomic_TestBit64(Atomic_uint64 *var, // IN + uint64 bit) // IN +{ +#if defined(__x86_64__) +#if defined(__GNUC__) + Bool out = FALSE; + ASSERT(bit <= 63); + __asm__ __volatile__( + "bt %2, %1; setc %0" + : "=rm"(out) + : "m" (var->value), + "rJ" (bit) + : "cc" + ); + return out; +#elif defined _MSC_VER + ASSERT(bit <= 63); + return (var->value & (CONST64U(1) << bit)) != 0; +#else +#error No compiler defined for Atomic_TestBit64 +#endif +#else // __x86_64__ + ASSERT(bit <= 63); + return (var->value & (CONST64U(1) << bit)) != 0; +#endif +} + + +#if defined(__GNUC__) +/* + *----------------------------------------------------------------------------- + * + * Atomic_Read16 -- + * + * Read and return. + * + * Results: + * The value of the atomic variable. + * + * Side effects: + * None. + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint16 +Atomic_Read16(Atomic_uint16 const *var) // IN +{ + uint16 value; + +#ifdef VMM + ASSERT((uintptr_t)var % 2 == 0); +#endif + +#if defined(__GNUC__) +#if (defined(__x86_64__) || defined(__i386__)) + + __asm__ __volatile__( + "movw %1, %0" + : "=r" (value) + : "m" (var->value) + ); +#elif defined(VM_ARM_V7) + NOT_TESTED(); + + __asm__ __volatile__( + "ldrh %0, [%1]" + : "=r" (value) + : "r" (&var->value) + ); +#elif defined(VM_ARM_64) + __asm__ __volatile__ ( + "ldrh %w0, [%1]" + : "=r" (value) + : "r" (&var->value) + ); + +#else +#error No 16-bits atomics. +#endif +#endif + + return value; +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_ReadWrite16 -- + * + * Read followed by write + * + * Results: + * The value of the atomic variable before the write. + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint16 +Atomic_ReadWrite16(Atomic_uint16 *var, // IN/OUT: + uint16 val) // IN: +{ +#if defined(__GNUC__) +#if (defined(__x86_64__) || defined(__i386__)) + __asm__ __volatile__( + "xchgw %0, %1" + : "=r" (val), + "+m" (var->value) + : "0" (val) + ); + AtomicEpilogue(); + return val; +#elif defined(VM_ARM_V7) + register volatile uint16 retVal; + register volatile uint16 res; + + NOT_TESTED(); + + dmb(); + + __asm__ __volatile__( + "1: ldrexh %[retVal], [%[var]] \n\t" + "strexh %[res], %[val], [%[var]] \n\t" + "teq %[res], #0 \n\t" + "bne 1b" + : [retVal] "=&r" (retVal), [res] "=&r" (res) + : [var] "r" (&var->value), [val] "r" (val) + : "cc" + ); + + dmb(); + + return retVal; +#elif defined(VM_ARM_64) + register uint16 retVal; + register uint16 failed; + + __asm__ __volatile__( + " dmb sy \n\t" + "1: ldxrh %w0, [%2] \n\t" + " stxrh %w1, %w3, [%2] \n\t" + " cbnz %w1, 1b \n\t" + " dmb sy \n\t" + : "=&r" (retVal), "=&r" (failed) + : "r" (&var->value), "r" (val) + : "memory" + ); + + return retVal; +#else +#error No 16-bits atomics. +#endif +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Write16 -- + * + * Write + * + * Results: + * None. 
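+ *
+ *      Usage sketch (illustrative; 'linkState' is a hypothetical
+ *      Atomic_uint16 declared by the caller):
+ *
+ *         Atomic_Write16(&linkState, 1);
+ *         uint16 s = Atomic_Read16(&linkState);   // s == 1 absent other writers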
+ * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Write16(Atomic_uint16 *var, // OUT: + uint16 val) // IN: +{ +#ifdef VMM + ASSERT((uintptr_t)var % 2 == 0); +#endif + +#if defined(__GNUC__) +#if (defined(__x86_64__) || defined(__i386__)) + + __asm__ __volatile__( + "movw %1, %0" + : "=m" (var->value) + : "r" (val) + ); +#elif defined(VM_ARM_ANY) + Atomic_ReadWrite16(var, val); +#else +#error No 16-bits atomics. +#endif +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_ReadIfEqualWrite16 -- + * + * Compare exchange: Read variable, if equal to oldVal, write newVal + * + * Results: + * The value of the atomic variable before the write. + * + * Side effects: + * The variable may be modified. + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint16 +Atomic_ReadIfEqualWrite16(Atomic_uint16 *var, // IN/OUT + uint16 oldVal, // IN + uint16 newVal) // IN +{ +#if defined(__GNUC__) +#if (defined(__x86_64__) || defined(__i386__)) + uint16 val; + + __asm__ __volatile__( + "lock; cmpxchgw %2, %1" + : "=a" (val), + "+m" (var->value) + : "r" (newVal), + "0" (oldVal) + : "cc" + ); + AtomicEpilogue(); + return val; +#elif defined(VM_ARM_V7) + register uint16 retVal; + register uint16 res; + + NOT_TESTED(); + + dmb(); + + __asm__ __volatile__( + "1: ldrexh %[retVal], [%[var]] \n\t" + "mov %[res], #0 \n\t" + "teq %[retVal], %[oldVal] \n\t" + "strexheq %[res], %[newVal], [%[var]] \n\t" + "teq %[res], #0 \n\t" + "bne 1b" + : [retVal] "=&r" (retVal), [res] "=&r" (res) + : [var] "r" (&var->value), [oldVal] "r" (oldVal), [newVal] "r" (newVal) + : "cc" + ); + + dmb(); + + return retVal; +#elif defined(VM_ARM_64) + register uint16 retVal; + register uint16 failed; + + __asm__ __volatile__ ( + " dmb sy \n\t" + "1: ldxrh %w0, [%2] \n\t" + " cmp %w0, %w3 \n\t" + " b.ne 2f \n\t" + " stxrh %w1, %w4, [%2] \n\t" + " cbnz %w1, 1b \n\t" + "2: clrex \n\t" + " dmb sy \n\t" + : "=&r" (retVal), "=&r" (failed) + : "r" (&var->value), "r" (oldVal), "r" (newVal) + : "cc", "memory"); + + return retVal; +#else +#error No 16-bits atomics. +#endif +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_And16 -- + * + * Atomic read, bitwise AND with a 16-bit value, write. + * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_And16(Atomic_uint16 *var, // IN/OUT + uint16 val) // IN +{ +#if defined(__GNUC__) +#if (defined(__x86_64__) || defined(__i386__)) + __asm__ __volatile__( + "lock; andw %1, %0" + : "+m" (var->value) + : "re" (val) + : "cc" + ); + AtomicEpilogue(); +#elif defined(VM_ARM_V7) + register volatile uint16 res; + register volatile uint16 tmp; + + NOT_TESTED(); + + dmb(); + + __asm__ __volatile__( + "1: ldrexh %[tmp], [%[var]] \n\t" + "and %[tmp], %[tmp], %[val] \n\t" + "strexh %[res], %[tmp], [%[var]] \n\t" + "teq %[res], #0 \n\t" + "bne 1b" + : [res] "=&r" (res), [tmp] "=&r" (tmp) + : [var] "r" (&var->value), [val] "r" (val) + : "cc" + ); + + dmb(); +#elif defined(VM_ARM_64) + ARM_64_ATOMIC_16_OPV_PRIVATE_FENCED(var, val, and); +#else +#error No 16-bits atomics. 
+#endif +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Or16 -- + * + * Atomic read, bitwise OR with a 16-bit value, write. + * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Or16(Atomic_uint16 *var, // IN/OUT + uint16 val) // IN +{ +#if defined(__GNUC__) +#if (defined(__x86_64__) || defined(__i386__)) + __asm__ __volatile__( + "lock; orw %1, %0" + : "+m" (var->value) + : "re" (val) + : "cc" + ); + AtomicEpilogue(); +#elif defined(VM_ARM_V7) + register volatile uint16 res; + register volatile uint16 tmp; + + NOT_TESTED(); + + dmb(); + + __asm__ __volatile__( + "1: ldrexh %[tmp], [%[var]] \n\t" + "orr %[tmp], %[tmp], %[val] \n\t" + "strexh %[res], %[tmp], [%[var]] \n\t" + "teq %[res], #0 \n\t" + "bne 1b" + : [res] "=&r" (res), [tmp] "=&r" (tmp) + : [var] "r" (&var->value), [val] "r" (val) + : "cc" + ); + + dmb(); +#elif defined(VM_ARM_64) + ARM_64_ATOMIC_16_OPV_PRIVATE_FENCED(var, val, orr); +#else +#error No 16-bits atomics. +#endif +#endif +} + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Xor16 -- + * + * Atomic read, bitwise XOR with a value, write. + * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Xor16(Atomic_uint16 *var, // IN/OUT + uint16 val) // IN +{ +#if defined(__GNUC__) +#if (defined(__x86_64__) || defined(__i386__)) + __asm__ __volatile__( + "lock; xorw %1, %0" + : "+m" (var->value) + : "re" (val) + : "cc" + ); + AtomicEpilogue(); +#elif defined(VM_ARM_V7) + register volatile uint16 res; + register volatile uint16 tmp; + + NOT_TESTED(); + + dmb(); + + __asm__ __volatile__( + "1: ldrexh %[tmp], [%[var]] \n\t" + "eor %[tmp], %[tmp], %[val] \n\t" + "strexh %[res], %[tmp], [%[var]] \n\t" + "teq %[res], #0 \n\t" + "bne 1b" + : [res] "=&r" (res), [tmp] "=&r" (tmp) + : [var] "r" (&var->value), [val] "r" (val) + : "cc" + ); + + dmb(); +#elif defined(VM_ARM_64) + ARM_64_ATOMIC_16_OPV_PRIVATE_FENCED(var, val, eor); +#else +#error No 16-bits atomics. +#endif +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Add16 -- + * + * Atomic read, add a value, write. + * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Add16(Atomic_uint16 *var, // IN/OUT + uint16 val) // IN +{ +#if defined(__GNUC__) +#if (defined(__x86_64__) || defined(__i386__)) + __asm__ __volatile__( + "lock; addw %1, %0" + : "+m" (var->value) + : "re" (val) + : "cc" + ); + AtomicEpilogue(); +#elif defined(VM_ARM_V7) + register volatile uint16 res; + register volatile uint16 tmp; + + NOT_TESTED(); + + dmb(); + + __asm__ __volatile__( + "1: ldrexh %[tmp], [%[var]] \n\t" + "add %[tmp], %[tmp], %[val] \n\t" + "strexh %[res], %[tmp], [%[var]] \n\t" + "teq %[res], #0 \n\t" + "bne 1b" + : [res] "=&r" (res), [tmp] "=&r" (tmp) + : [var] "r" (&var->value), [val] "r" (val) + : "cc" + ); + + dmb(); +#elif defined(VM_ARM_64) + ARM_64_ATOMIC_16_OPV_PRIVATE_FENCED(var, val, add); +#else +#error No 16-bits atomics. +#endif +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Sub16 -- + * + * Atomic read, subtract a value, write. 
+ * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Sub16(Atomic_uint16 *var, // IN/OUT + uint16 val) // IN +{ +#if defined(__GNUC__) +#if (defined(__x86_64__) || defined(__i386__)) + __asm__ __volatile__( + "lock; subw %1, %0" + : "+m" (var->value) + : "re" (val) + : "cc" + ); + AtomicEpilogue(); +#elif defined(VM_ARM_V7) + register volatile uint16 res; + register volatile uint16 tmp; + + NOT_TESTED(); + + dmb(); + + __asm__ __volatile__( + "1: ldrexh %[tmp], [%[var]] \n\t" + "sub %[tmp], %[tmp], %[val] \n\t" + "strexh %[res], %[tmp], [%[var]] \n\t" + "teq %[res], #0 \n\t" + "bne 1b" + : [res] "=&r" (res), [tmp] "=&r" (tmp) + : [var] "r" (&var->value), [val] "r" (val) + : "cc" + ); + + dmb(); +#elif defined(VM_ARM_64) + ARM_64_ATOMIC_16_OPV_PRIVATE_FENCED(var, val, sub); +#else +#error No 16-bits atomics. +#endif +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Inc16 -- + * + * Atomic read, increment, write. + * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Inc16(Atomic_uint16 *var) // IN/OUT +{ +#if defined(__GNUC__) +#if (defined(__x86_64__) || defined(__i386__)) + __asm__ __volatile__( + "lock; incw %0" + : "+m" (var->value) + : + : "cc" + ); + AtomicEpilogue(); +#elif defined(VM_ARM_ANY) + Atomic_Add16(var, 1); +#else +#error No 16-bits atomics. +#endif +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_Dec16 -- + * + * Atomic read, decrement, write. + * + * Results: + * None + * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE void +Atomic_Dec16(Atomic_uint16 *var) // IN/OUT +{ +#if defined(__GNUC__) +#if (defined(__x86_64__) || defined(__i386__)) + __asm__ __volatile__( + "lock; decw %0" + : "+m" (var->value) + : + : "cc" + ); + AtomicEpilogue(); +#elif defined(VM_ARM_ANY) + Atomic_Sub16(var, 1); +#else +#error No 16-bits atomics. +#endif +#endif +} + + +/* + *----------------------------------------------------------------------------- + * + * Atomic_ReadOr16 -- + * + * Atomic read (returned), bitwise OR with a value, write. + * + * Results: + * The value of the variable before the operation. 
+ * + * Side effects: + * None + * + *----------------------------------------------------------------------------- + */ + +static INLINE uint16 +Atomic_ReadOr16(Atomic_uint16 *var, // IN/OUT + uint16 val) // IN +{ + uint16 res; + + do { + res = var->value; + } while (res != Atomic_ReadIfEqualWrite16(var, res, res | val)); + + return res; +} + + +/* + *---------------------------------------------------------------------- + * + * Atomic_ReadAdd16 -- + * + * Atomically adds a 16-bit integer to another + * + * Results: + * Returns the old value just prior to the addition + * + * Side effects: + * None + * + *---------------------------------------------------------------------- + */ + +static INLINE uint16 +Atomic_ReadAdd16(Atomic_uint16 *var, // IN/OUT + uint16 val) // IN: +{ +#if defined(__GNUC__) +#if (defined(__x86_64__) || defined(__i386__)) + __asm__ __volatile__( + "lock; xaddw %0, %1" + : "=r" (val), + "+m" (var->value) + : "0" (val) + : "cc" + ); + AtomicEpilogue(); + return val; +#elif defined(VM_ARM_V7) + register volatile uint16 res; + register volatile uint16 retVal; + register volatile uint16 tmp; + + NOT_TESTED(); + + dmb(); + + __asm__ __volatile__( + "1: ldrexh %[retVal], [%[var]] \n\t" + "add %[tmp], %[val], %[retVal] \n\t" + "strexh %[res], %[tmp], [%[var]] \n\t" + "teq %[res], #0 \n\t" + "bne 1b" + : [tmp] "=&r" (tmp), [res] "=&r" (res), [retVal] "=&r" (retVal) + : [var] "r" (&var->value), [val] "r" (val) + : "cc" + ); + + dmb(); + + return retVal; +#elif defined(VM_ARM_64) + return ARM_64_ATOMIC_16_OPO_PRIVATE_FENCED(var, val, add); +#else +#error No 16-bits atomics. +#endif +#endif +} + + +/* + *---------------------------------------------------------------------- + * + * Atomic_ReadInc16 -- + * + * Atomically increments a 64-bit integer + * + * Results: + * Returns the old value just prior to incrementing + * + * Side effects: + * None + * + *---------------------------------------------------------------------- + */ + +static INLINE uint16 +Atomic_ReadInc16(Atomic_uint16 *var) // IN/OUT +{ + return Atomic_ReadAdd16(var, 1); +} + +/* + + *---------------------------------------------------------------------- + * + * Atomic_ReadDec16 -- + * + * Atomically decrements a 64-bit integer + * + * Results: + * Returns the old value just prior to decrementing + * + * Side effects: + * None + * + *---------------------------------------------------------------------- + */ + +static INLINE uint16 +Atomic_ReadDec16(Atomic_uint16 *var) // IN/OUT +{ + return Atomic_ReadAdd16(var, -1); +} +#endif + +/* + * Template code for the Atomic_ type and its operators. + * + * The cast argument is an intermediate type cast to make some + * compilers stop complaining about casting uint32 <-> void *, + * even though we only do it in the 32-bit case so they are always + * the same size. So for val of type uint32, instead of + * (void *)val, we have (void *)(uintptr_t)val. + * The specific problem case is the Windows ddk compiler + * (as used by the SVGA driver). -- edward + * + * NOTE: See the comment in vm_assert.h for why we need UNUSED_TYPE in + * AtomicAssertOnCompile(), and why we need to be very careful doing so. + */ + +#define MAKE_ATOMIC_TYPE(name, size, in, out, cast) \ + typedef Atomic_uint ## size Atomic_ ## name; \ + \ + \ + static INLINE void \ + AtomicAssertOnCompile ## name(void) \ + { \ + enum { AssertOnCompileMisused = 8 * sizeof (in) == size \ + && 8 * sizeof (out) == size \ + && 8 * sizeof (cast) == size \ + ? 
+                                      ? 1 : -1 }; \
+      UNUSED_TYPE(typedef char AssertOnCompileFailed[AssertOnCompileMisused]);\
+   } \
+ \
+ \
+   static INLINE out \
+   Atomic_Read ## name(Atomic_ ## name const *var) \
+   { \
+      return (out)(cast)Atomic_Read ## size(var); \
+   } \
+ \
+ \
+   static INLINE void \
+   Atomic_Write ## name(Atomic_ ## name *var, \
+                        in val) \
+   { \
+      Atomic_Write ## size(var, (uint ## size)(cast)val); \
+   } \
+ \
+ \
+   static INLINE out \
+   Atomic_ReadWrite ## name(Atomic_ ## name *var, \
+                            in val) \
+   { \
+      return (out)(cast)Atomic_ReadWrite ## size(var, \
+                                                 (uint ## size)(cast)val); \
+   } \
+ \
+ \
+   static INLINE out \
+   Atomic_ReadIfEqualWrite ## name(Atomic_ ## name *var, \
+                                   in oldVal, \
+                                   in newVal) \
+   { \
+      return (out)(cast)Atomic_ReadIfEqualWrite ## size(var, \
+         (uint ## size)(cast)oldVal, (uint ## size)(cast)newVal); \
+   } \
+ \
+ \
+   static INLINE void \
+   Atomic_And ## name(Atomic_ ## name *var, \
+                      in val) \
+   { \
+      Atomic_And ## size(var, (uint ## size)(cast)val); \
+   } \
+ \
+ \
+   static INLINE void \
+   Atomic_Or ## name(Atomic_ ## name *var, \
+                     in val) \
+   { \
+      Atomic_Or ## size(var, (uint ## size)(cast)val); \
+   } \
+ \
+ \
+   static INLINE void \
+   Atomic_Xor ## name(Atomic_ ## name *var, \
+                      in val) \
+   { \
+      Atomic_Xor ## size(var, (uint ## size)(cast)val); \
+   } \
+ \
+ \
+   static INLINE void \
+   Atomic_Add ## name(Atomic_ ## name *var, \
+                      in val) \
+   { \
+      Atomic_Add ## size(var, (uint ## size)(cast)val); \
+   } \
+ \
+ \
+   static INLINE void \
+   Atomic_Sub ## name(Atomic_ ## name *var, \
+                      in val) \
+   { \
+      Atomic_Sub ## size(var, (uint ## size)(cast)val); \
+   } \
+ \
+ \
+   static INLINE void \
+   Atomic_Inc ## name(Atomic_ ## name *var) \
+   { \
+      Atomic_Inc ## size(var); \
+   } \
+ \
+ \
+   static INLINE void \
+   Atomic_Dec ## name(Atomic_ ## name *var) \
+   { \
+      Atomic_Dec ## size(var); \
+   } \
+ \
+ \
+   static INLINE out \
+   Atomic_ReadOr ## name(Atomic_ ## name *var, \
+                         in val) \
+   { \
+      return (out)(cast)Atomic_ReadOr ## size(var, (uint ## size)(cast)val); \
+   } \
+ \
+ \
+   static INLINE out \
+   Atomic_ReadAdd ## name(Atomic_ ## name *var, \
+                          in val) \
+   { \
+      return (out)(cast)Atomic_ReadAdd ## size(var, (uint ## size)(cast)val); \
+   } \
+ \
+ \
+   static INLINE out \
+   Atomic_ReadInc ## name(Atomic_ ## name *var) \
+   { \
+      return (out)(cast)Atomic_ReadInc ## size(var); \
+   } \
+ \
+ \
+   static INLINE out \
+   Atomic_ReadDec ## name(Atomic_ ## name *var) \
+   { \
+      return (out)(cast)Atomic_ReadDec ## size(var); \
+   }
+
+
+/*
+ * Since we use a macro to generate these definitions, it is hard to look for
+ * them. So DO NOT REMOVE THIS COMMENT and keep it up-to-date. --hpreg
+ *
+ * Atomic_Ptr
+ * Atomic_ReadPtr --
+ * Atomic_WritePtr --
+ * Atomic_ReadWritePtr --
+ * Atomic_ReadIfEqualWritePtr --
+ * Atomic_AndPtr --
+ * Atomic_OrPtr --
+ * Atomic_XorPtr --
+ * Atomic_AddPtr --
+ * Atomic_SubPtr --
+ * Atomic_IncPtr --
+ * Atomic_DecPtr --
+ * Atomic_ReadOrPtr --
+ * Atomic_ReadAddPtr --
+ * Atomic_ReadIncPtr --
+ * Atomic_ReadDecPtr --
+ *
+ * Atomic_Int
+ * Atomic_ReadInt --
+ * Atomic_WriteInt --
+ * Atomic_ReadWriteInt --
+ * Atomic_ReadIfEqualWriteInt --
+ * Atomic_AndInt --
+ * Atomic_OrInt --
+ * Atomic_XorInt --
+ * Atomic_AddInt --
+ * Atomic_SubInt --
+ * Atomic_IncInt --
+ * Atomic_DecInt --
+ * Atomic_ReadOrInt --
+ * Atomic_ReadAddInt --
+ * Atomic_ReadIncInt --
+ * Atomic_ReadDecInt --
+ */
+#if defined(VM_64BIT)
+MAKE_ATOMIC_TYPE(Ptr, 64, void const *, void *, uintptr_t)
+#else
+MAKE_ATOMIC_TYPE(Ptr, 32, void const *, void *, uintptr_t)
+#endif
+MAKE_ATOMIC_TYPE(Int, 32, int, int, int)
+
+
+/* Prevent the compiler from re-ordering memory references. */
+#ifdef __GNUC__
+#define ATOMIC_COMPILER_BARRIER() __asm__ __volatile__ ("": : :"memory")
+#elif defined(_MSC_VER)
+#define ATOMIC_COMPILER_BARRIER() _ReadWriteBarrier()
+#else
+#error No compiler defined for ATOMIC_COMPILER_BARRIER
+#endif
+
+
+/*
+ *-----------------------------------------------------------------------------
+ *
+ * Atomic_MFence --
+ *
+ *      Implements mfence in terms of a lock xor. The reason for implementing
+ *      our own mfence is that not all of our supported cpus have an assembly
+ *      mfence (P3, Athlon). We put it here to avoid duplicating code which is
+ *      also why it is prefixed with "Atomic_". Moreover, this implementation
+ *      performs slightly better than 'mfence' on modern CPUs (See PR 817059).
+ *
+ * Results:
+ *      None.
+ *
+ * Side effects:
+ *      Cause loads and stores prior to this to be globally
+ *      visible.
+ *
+ *-----------------------------------------------------------------------------
+ */
+
+static INLINE void
+Atomic_MFence(void)
+{
+   Atomic_uint32 fence;
+   ATOMIC_COMPILER_BARRIER();
+   Atomic_Xor(&fence, 0x1);
+   ATOMIC_COMPILER_BARRIER();
+}
+
+#ifdef ATOMIC_COMPILER_BARRIER
+#undef ATOMIC_COMPILER_BARRIER
+#endif /* ATOMIC_COMPILER_BARRIER */
+
+#endif // ifndef _ATOMIC_H_
diff --git a/vmmon-only/include/vm_basic_asm.h b/vmmon-only/include/vm_basic_asm.h
new file mode 100644
index 00000000..0e4adae6
--- /dev/null
+++ b/vmmon-only/include/vm_basic_asm.h
@@ -0,0 +1,1258 @@
+/*********************************************************
+ * Copyright (C) 2003-2015 VMware, Inc. All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU General Public License as published by the
+ * Free Software Foundation version 2 and no later version.
+ *
+ * This program is distributed in the hope that it will be useful, but
+ * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
+ * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
+ * for more details.
+ *
+ * You should have received a copy of the GNU General Public License along
+ * with this program; if not, write to the Free Software Foundation, Inc.,
+ * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
+ *
+ *********************************************************/
+
+/*
+ * vm_basic_asm.h
+ *
+ *      Basic asm macros
+ */
+
+#ifndef _VM_BASIC_ASM_H_
+#define _VM_BASIC_ASM_H_
+
+#define INCLUDE_ALLOW_USERLEVEL
+
+#define INCLUDE_ALLOW_MODULE
+#define INCLUDE_ALLOW_VMMON
+#define INCLUDE_ALLOW_VMK_MODULE
+#define INCLUDE_ALLOW_VMKERNEL
+#define INCLUDE_ALLOW_DISTRIBUTE
+#define INCLUDE_ALLOW_VMCORE
+#include "includeCheck.h"
+
+#include "vm_basic_types.h"
+
+#if defined VM_X86_64
+#include "vm_basic_asm_x86_common.h"
+#include "vm_basic_asm_x86_64.h"
+#elif defined VM_X86_32
+#include "vm_basic_asm_x86_common.h"
+#include "vm_basic_asm_x86.h"
+#elif defined VM_ARM_64
+#include "arm64_basic_defs.h"
+#include "vm_basic_asm_arm64.h"
+#else
+#define MUL64_NO_ASM 1
+#include "mul64.h"
+#endif
+
+/*
+ * Locate most and least significant bit set functions. Use our own name
+ * space to avoid namespace collisions. The new names follow a pattern,
+ *