 83974cf4f8
			
		
	
	
		83974cf4f8
		
	
	
	
	
		
			
			Commit f0aff0f124 ("cputlb: add assert_cpu_is_self checks") buried
the increment of tlb_flush_count under TLB_DEBUG. This results in
"info jit" always (mis)reporting 0 TLB flushes when !TLB_DEBUG.
Besides, under MTTCG tlb_flush_count is updated by several threads,
so in order not to lose counts we'd either have to use atomic ops
or distribute the counter, which is more scalable.
This patch does the latter by embedding tlb_flush_count in CPUArchState.
The global count is then easily obtained by iterating over the CPU list.
Note that this change also requires updating the accessors to
tlb_flush_count to use atomic_read/set whenever there may be conflicting
accesses (as defined in C11) to it.
Reviewed-by: Richard Henderson <rth@twiddle.net>
Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
Signed-off-by: Emilio G. Cota <cota@braap.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
		
	
			
		
			
				
	
	
		
			157 lines
		
	
	
		
			5.7 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			157 lines
		
	
	
		
			5.7 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * common defines for all CPUs
 | |
|  *
 | |
|  * Copyright (c) 2003 Fabrice Bellard
 | |
|  *
 | |
|  * This library is free software; you can redistribute it and/or
 | |
|  * modify it under the terms of the GNU Lesser General Public
 | |
|  * License as published by the Free Software Foundation; either
 | |
|  * version 2 of the License, or (at your option) any later version.
 | |
|  *
 | |
|  * This library is distributed in the hope that it will be useful,
 | |
|  * but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 | |
|  * Lesser General Public License for more details.
 | |
|  *
 | |
|  * You should have received a copy of the GNU Lesser General Public
 | |
|  * License along with this library; if not, see <http://www.gnu.org/licenses/>.
 | |
|  */
 | |
| #ifndef CPU_DEFS_H
 | |
| #define CPU_DEFS_H
 | |
| 
 | |
| #ifndef NEED_CPU_H
 | |
| #error cpu.h included from common code
 | |
| #endif
 | |
| 
 | |
| #include "qemu/host-utils.h"
 | |
| #include "qemu/queue.h"
 | |
| #ifdef CONFIG_TCG
 | |
| #include "tcg-target.h"
 | |
| #endif
 | |
| #ifndef CONFIG_USER_ONLY
 | |
| #include "exec/hwaddr.h"
 | |
| #endif
 | |
| #include "exec/memattrs.h"
 | |
| 
 | |
| #ifndef TARGET_LONG_BITS
 | |
| #error TARGET_LONG_BITS must be defined before including this header
 | |
| #endif
 | |
| 
 | |
| #define TARGET_LONG_SIZE (TARGET_LONG_BITS / 8)
 | |
| 
 | |
| /* target_ulong is the type of a virtual address */
 | |
| #if TARGET_LONG_SIZE == 4
 | |
| typedef int32_t target_long;
 | |
| typedef uint32_t target_ulong;
 | |
| #define TARGET_FMT_lx "%08x"
 | |
| #define TARGET_FMT_ld "%d"
 | |
| #define TARGET_FMT_lu "%u"
 | |
| #elif TARGET_LONG_SIZE == 8
 | |
| typedef int64_t target_long;
 | |
| typedef uint64_t target_ulong;
 | |
| #define TARGET_FMT_lx "%016" PRIx64
 | |
| #define TARGET_FMT_ld "%" PRId64
 | |
| #define TARGET_FMT_lu "%" PRIu64
 | |
| #else
 | |
| #error TARGET_LONG_SIZE undefined
 | |
| #endif
 | |
| 
 | |
| #if !defined(CONFIG_USER_ONLY) && defined(CONFIG_TCG)
 | |
| /* use a fully associative victim tlb of 8 entries */
 | |
| #define CPU_VTLB_SIZE 8
 | |
| 
 | |
| #if HOST_LONG_BITS == 32 && TARGET_LONG_BITS == 32
 | |
| #define CPU_TLB_ENTRY_BITS 4
 | |
| #else
 | |
| #define CPU_TLB_ENTRY_BITS 5
 | |
| #endif
 | |
| 
 | |
| /* TCG_TARGET_TLB_DISPLACEMENT_BITS is used in CPU_TLB_BITS to ensure that
 | |
|  * the TLB is not unnecessarily small, but still small enough for the
 | |
|  * TLB lookup instruction sequence used by the TCG target.
 | |
|  *
 | |
|  * TCG will have to generate an operand as large as the distance between
 | |
|  * env and the tlb_table[NB_MMU_MODES - 1][0].addend.  For simplicity,
 | |
|  * the TCG targets just round everything up to the next power of two, and
 | |
|  * count bits.  This works because: 1) the size of each TLB is a largish
 | |
|  * power of two, 2) and because the limit of the displacement is really close
 | |
|  * to a power of two, 3) the offset of tlb_table[0][0] inside env is smaller
 | |
|  * than the size of a TLB.
 | |
|  *
 | |
|  * For example, the maximum displacement 0xFFF0 on PPC and MIPS, but TCG
 | |
|  * just says "the displacement is 16 bits".  TCG_TARGET_TLB_DISPLACEMENT_BITS
 | |
|  * then ensures that tlb_table at least 0x8000 bytes large ("not unnecessarily
 | |
|  * small": 2^15).  The operand then will come up smaller than 0xFFF0 without
 | |
|  * any particular care, because the TLB for a single MMU mode is larger than
 | |
|  * 0x10000-0xFFF0=16 bytes.  In the end, the maximum value of the operand
 | |
|  * could be something like 0xC000 (the offset of the last TLB table) plus
 | |
|  * 0x18 (the offset of the addend field in each TLB entry) plus the offset
 | |
|  * of tlb_table inside env (which is non-trivial but not huge).
 | |
|  */
 | |
| #define CPU_TLB_BITS                                             \
 | |
|     MIN(8,                                                       \
 | |
|         TCG_TARGET_TLB_DISPLACEMENT_BITS - CPU_TLB_ENTRY_BITS -  \
 | |
|         (NB_MMU_MODES <= 1 ? 0 :                                 \
 | |
|          NB_MMU_MODES <= 2 ? 1 :                                 \
 | |
|          NB_MMU_MODES <= 4 ? 2 :                                 \
 | |
|          NB_MMU_MODES <= 8 ? 3 : 4))
 | |
| 
 | |
| #define CPU_TLB_SIZE (1 << CPU_TLB_BITS)
 | |
| 
 | |
| typedef struct CPUTLBEntry {
 | |
|     /* bit TARGET_LONG_BITS to TARGET_PAGE_BITS : virtual address
 | |
|        bit TARGET_PAGE_BITS-1..4  : Nonzero for accesses that should not
 | |
|                                     go directly to ram.
 | |
|        bit 3                      : indicates that the entry is invalid
 | |
|        bit 2..0                   : zero
 | |
|     */
 | |
|     union {
 | |
|         struct {
 | |
|             target_ulong addr_read;
 | |
|             target_ulong addr_write;
 | |
|             target_ulong addr_code;
 | |
|             /* Addend to virtual address to get host address.  IO accesses
 | |
|                use the corresponding iotlb value.  */
 | |
|             uintptr_t addend;
 | |
|         };
 | |
|         /* padding to get a power of two size */
 | |
|         uint8_t dummy[1 << CPU_TLB_ENTRY_BITS];
 | |
|     };
 | |
| } CPUTLBEntry;
 | |
| 
 | |
| QEMU_BUILD_BUG_ON(sizeof(CPUTLBEntry) != (1 << CPU_TLB_ENTRY_BITS));
 | |
| 
 | |
| /* The IOTLB is not accessed directly inline by generated TCG code,
 | |
|  * so the CPUIOTLBEntry layout is not as critical as that of the
 | |
|  * CPUTLBEntry. (This is also why we don't want to combine the two
 | |
|  * structs into one.)
 | |
|  */
 | |
| typedef struct CPUIOTLBEntry {
 | |
|     hwaddr addr;
 | |
|     MemTxAttrs attrs;
 | |
| } CPUIOTLBEntry;
 | |
| 
 | |
| #define CPU_COMMON_TLB \
 | |
|     /* The meaning of the MMU modes is defined in the target code. */   \
 | |
|     CPUTLBEntry tlb_table[NB_MMU_MODES][CPU_TLB_SIZE];                  \
 | |
|     CPUTLBEntry tlb_v_table[NB_MMU_MODES][CPU_VTLB_SIZE];               \
 | |
|     CPUIOTLBEntry iotlb[NB_MMU_MODES][CPU_TLB_SIZE];                    \
 | |
|     CPUIOTLBEntry iotlb_v[NB_MMU_MODES][CPU_VTLB_SIZE];                 \
 | |
|     size_t tlb_flush_count;                                             \
 | |
|     target_ulong tlb_flush_addr;                                        \
 | |
|     target_ulong tlb_flush_mask;                                        \
 | |
|     target_ulong vtlb_index;                                            \
 | |
| 
 | |
| #else
 | |
| 
 | |
| #define CPU_COMMON_TLB
 | |
| 
 | |
| #endif
 | |
| 
 | |
| 
 | |
| #define CPU_COMMON                                                      \
 | |
|     /* soft mmu support */                                              \
 | |
|     CPU_COMMON_TLB                                                      \
 | |
| 
 | |
| #endif
 |