1 /*
   2  * CDDL HEADER START
   3  *
   4  * The contents of this file are subject to the terms of the
   5  * Common Development and Distribution License (the "License").
   6  * You may not use this file except in compliance with the License.
   7  *
   8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
   9  * or http://www.opensolaris.org/os/licensing.
  10  * See the License for the specific language governing permissions
  11  * and limitations under the License.
  12  *
  13  * When distributing Covered Code, include this CDDL HEADER in each
  14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
  15  * If applicable, add the following below this CDDL HEADER, with the
  16  * fields enclosed by brackets "[]" replaced with your own identifying
  17  * information: Portions Copyright [yyyy] [name of copyright owner]
  18  *
  19  * CDDL HEADER END
  20  */
  21 /*
  22  * Copyright 2009 Sun Microsystems, Inc.  All rights reserved.
  23  * Use is subject to license terms.
  24  */
  25 /*
  26  * Copyright 2018 Joyent, Inc.
  27  */
  28 
  29 #ifndef _SYS_MACHCPUVAR_H
  30 #define _SYS_MACHCPUVAR_H
  31 
  32 #ifdef  __cplusplus
  33 extern "C" {
  34 #endif
  35 
  36 #include <sys/inttypes.h>
  37 #include <sys/x_call.h>
  38 #include <sys/tss.h>
  39 #include <sys/segments.h>
  40 #include <sys/rm_platter.h>
  41 #include <sys/avintr.h>
  42 #include <sys/pte.h>
  43 #include <sys/stddef.h>
  44 #include <sys/debug.h>
  45 #include <sys/cpuvar.h>
  46 
  47 #ifndef _ASM
  48 /*
  49  * On a virtualized platform a virtual cpu may not be actually
  50  * on a physical cpu, especially in situations where a configuration has
  51  * more vcpus than pcpus.  This function tells us (if it's able) if the
  52  * specified vcpu is currently running on a pcpu.  Note if it is not
  53  * known or not able to determine, it will return the unknown state.
  54  */
  55 #define VCPU_STATE_UNKNOWN      0
  56 #define VCPU_ON_PCPU            1
  57 #define VCPU_NOT_ON_PCPU        2
  58 
  59 extern int vcpu_on_pcpu(processorid_t);
  60 
  61 /*
  62  * Machine specific fields of the cpu struct
  63  * defined in common/sys/cpuvar.h.
  64  *
  65  * Note:  This is kinda kludgy but seems to be the best
  66  * of our alternatives.
  67  */
  68 
  69 struct cpuid_info;
  70 struct cpu_ucode_info;
  71 struct cmi_hdl;
  72 
  73 /*
  74  * A note about the hypervisor affinity bits: a one bit in the affinity mask
  75  * means the corresponding event channel is allowed to be serviced
  76  * by this cpu.
  77  */
  78 struct xen_evt_data {
  79         ulong_t         pending_sel[PIL_MAX + 1]; /* event array selectors */
  80         ulong_t         pending_evts[PIL_MAX + 1][sizeof (ulong_t) * 8];
  81         ulong_t         evt_affinity[sizeof (ulong_t) * 8]; /* service on cpu */
  82 };
  83 
  84 struct kpti_frame {
  85         uint64_t        kf_lower_redzone;
  86 
  87         /* Stashed value of %cr3 when we entered the trampoline. */
  88         greg_t          kf_tr_cr3;
  89 
  90         /*
  91          * We use %r13-r14 as scratch registers in the trampoline code,
  92          * so stash those here "below" the rest of the stack so they can be
  93          * pushed/popped if needed.
  94          */
  95         greg_t          kf_r14;
  96         greg_t          kf_r13;
  97 
  98         /*
  99          * Part of this struct is used as the HW stack frame when taking an
 100          * interrupt on the user page table. The CPU is going to push a bunch
 101          * of regs onto the stack pointer set in the TSS/IDT (which we set to
 102          * &kf_rsp here).
 103          *
 104          * This is only a temporary holding area for them (we'll move them over
 105          * to the real interrupt stack once we've set %cr3).
 106          *
 107          * Note that these must be cleared during a process switch on this cpu.
 108          */
 109         greg_t          kf_err;         /* Bottom of initial hw stack frame */
 110         greg_t          kf_rip;
 111         greg_t          kf_cs;
 112         greg_t          kf_rflags;
 113         greg_t          kf_rsp;
 114         greg_t          kf_ss;
 115 
 116         greg_t          kf_tr_rsp;      /* Top of HW stack frame */
 117         /* We also write this with the %rsp value on tramp entry */
 118 
 119         /* Written to 0x1 when this kpti_frame is in use. */
 120         uint64_t        kf_tr_flag;
 121 
 122         uint64_t        kf_middle_redzone;
 123 
 124         /*
 125          * The things we need to write to %cr3 to change between page tables.
 126          * These live "above" the HW stack.
 127          */
 128         greg_t          kf_kernel_cr3;
 129         greg_t          kf_user_cr3;
 130         greg_t          kf_tr_ret_rsp;
 131 
 132         uint64_t        kf_unused;              /* For 16-byte align */
 133 
 134         uint64_t        kf_upper_redzone;
 135 };
 136 
 137 typedef struct cpu_ht {
 138         lock_t ch_lock;
 139         char ch_pad[56];
 140         struct cpu *ch_sib;
 141         volatile uint64_t ch_intr_depth;
 142         volatile uint64_t ch_state;
 143         volatile uint64_t ch_sibstate;
 144 } cpu_ht_t;
 145 
 146 /*
 147  * This first value, MACHCPU_SIZE is the size of all the members in the cpu_t
 148  * AND struct machcpu, before we get to the mcpu_pad and the kpti area.
 149  * The KPTI is used to contain per-CPU data that is visible in both sets of
 150  * page-tables, and hence must be page-aligned and page-sized. See
 151  * hat_pcp_setup().
 152  *
 153  * There are CTASSERTs in os/intr.c that verify this all works out.
 154  */
 155 #define MACHCPU_SIZE    (1568 + 688)
 156 #define MACHCPU_PAD     (MMU_PAGESIZE - MACHCPU_SIZE)
 157 #define MACHCPU_PAD2    (MMU_PAGESIZE - 16 - 3 * sizeof (struct kpti_frame))
 158 
 159 struct  machcpu {
 160         /*
 161          * x_call fields - used for interprocessor cross calls
 162          */
 163         struct xc_msg   *xc_msgbox;
 164         struct xc_msg   *xc_free;
 165         xc_data_t       xc_data;
 166         uint32_t        xc_wait_cnt;
 167         volatile uint32_t xc_work_cnt;
 168 
 169         int             mcpu_nodeid;            /* node-id */
 170         int             mcpu_pri;               /* CPU priority */
 171 
 172         struct hat      *mcpu_current_hat; /* cpu's current hat */
 173 
 174         struct hat_cpu_info     *mcpu_hat_info;
 175 
 176         volatile ulong_t        mcpu_tlb_info;
 177 
 178         /* i86 hardware table addresses that cannot be shared */
 179 
 180         user_desc_t     *mcpu_gdt;      /* GDT */
 181         gate_desc_t     *mcpu_idt;      /* current IDT */
 182 
 183         tss_t           *mcpu_tss;      /* TSS */
 184         void            *mcpu_ldt;
 185         size_t          mcpu_ldt_len;
 186 
 187         kmutex_t        mcpu_ppaddr_mutex;
 188         caddr_t         mcpu_caddr1;    /* per cpu CADDR1 */
 189         caddr_t         mcpu_caddr2;    /* per cpu CADDR2 */
 190         uint64_t        mcpu_caddr1pte;
 191         uint64_t        mcpu_caddr2pte;
 192 
 193         struct softint  mcpu_softinfo;
 194         uint64_t        pil_high_start[HIGH_LEVELS];
 195         uint64_t        intrstat[PIL_MAX + 1][2];
 196 
 197         struct cpuid_info        *mcpu_cpi;
 198 
 199 #if defined(__amd64)
 200         greg_t  mcpu_rtmp_rsp;          /* syscall: temporary %rsp stash */
 201         greg_t  mcpu_rtmp_r15;          /* syscall: temporary %r15 stash */
 202 #endif
 203 
 204         struct vcpu_info *mcpu_vcpu_info;
 205         uint64_t        mcpu_gdtpa;     /* hypervisor: GDT physical address */
 206 
 207         uint16_t mcpu_intr_pending;     /* hypervisor: pending intrpt levels */
 208         uint16_t mcpu_ec_mbox;          /* hypervisor: evtchn_dev mailbox */
 209         struct xen_evt_data *mcpu_evt_pend; /* hypervisor: pending events */
 210 
 211         volatile uint32_t *mcpu_mwait;  /* MONITOR/MWAIT buffer */
 212         void (*mcpu_idle_cpu)(void);    /* idle function */
 213         uint16_t mcpu_idle_type;        /* CPU next idle type */
 214         uint16_t max_cstates;           /* supported max cstates */
 215 
 216         struct cpu_ucode_info   *mcpu_ucode_info;
 217 
 218         void                    *mcpu_pm_mach_state;
 219         struct cmi_hdl          *mcpu_cmi_hdl;
 220         void                    *mcpu_mach_ctx_ptr;
 221 
 222         /*
 223          * A stamp that is unique per processor and changes
 224          * whenever an interrupt happens. Userful for detecting
 225          * if a section of code gets interrupted.
 226          * The high order 16 bits will hold the cpu->cpu_id.
 227          * The low order bits will be incremented on every interrupt.
 228          */
 229         volatile uint32_t       mcpu_istamp;
 230 
 231         cpu_ht_t                mcpu_ht;
 232 
 233         char                    mcpu_pad[MACHCPU_PAD];
 234 
 235         /* This is the start of the page */
 236         char                    mcpu_pad2[MACHCPU_PAD2];
 237         struct kpti_frame       mcpu_kpti;
 238         struct kpti_frame       mcpu_kpti_flt;
 239         struct kpti_frame       mcpu_kpti_dbg;
 240         char                    mcpu_pad3[16];
 241 };
 242 
 243 #define NINTR_THREADS   (LOCK_LEVEL-1)  /* number of interrupt threads */
 244 #define MWAIT_HALTED    (1)             /* mcpu_mwait set when halting */
 245 #define MWAIT_RUNNING   (0)             /* mcpu_mwait set to wakeup */
 246 #define MWAIT_WAKEUP_IPI        (2)     /* need IPI to wakeup */
 247 #define MWAIT_WAKEUP(cpu)       (*((cpu)->cpu_m.mcpu_mwait) = MWAIT_RUNNING)
 248 
 249 #endif  /* _ASM */
 250 
 251 /* Please DON'T add any more of this namespace-poisoning sewage here */
 252 
 253 #define cpu_nodeid cpu_m.mcpu_nodeid
 254 #define cpu_pri cpu_m.mcpu_pri
 255 #define cpu_current_hat cpu_m.mcpu_current_hat
 256 #define cpu_hat_info cpu_m.mcpu_hat_info
 257 #define cpu_ppaddr_mutex cpu_m.mcpu_ppaddr_mutex
 258 #define cpu_gdt cpu_m.mcpu_gdt
 259 #define cpu_idt cpu_m.mcpu_idt
 260 #define cpu_tss cpu_m.mcpu_tss
 261 #define cpu_caddr1 cpu_m.mcpu_caddr1
 262 #define cpu_caddr2 cpu_m.mcpu_caddr2
 263 #define cpu_softinfo cpu_m.mcpu_softinfo
 264 #define cpu_caddr1pte cpu_m.mcpu_caddr1pte
 265 #define cpu_caddr2pte cpu_m.mcpu_caddr2pte
 266 
 267 #ifdef  __cplusplus
 268 }
 269 #endif
 270 
 271 #endif  /* _SYS_MACHCPUVAR_H */