2015-10-19 21:12:53 +02:00
|
|
|
/** @file
|
|
|
|
Code for Processor S3 restoration
|
|
|
|
|
2019-08-05 08:41:43 +02:00
|
|
|
Copyright (c) 2006 - 2019, Intel Corporation. All rights reserved.<BR>
|
2019-04-04 01:07:22 +02:00
|
|
|
SPDX-License-Identifier: BSD-2-Clause-Patent
|
2015-10-19 21:12:53 +02:00
|
|
|
|
|
|
|
**/
|
|
|
|
|
|
|
|
#include "PiSmmCpuDxeSmm.h"
|
|
|
|
|
2018-01-11 10:05:15 +01:00
|
|
|
#pragma pack(1)
|
2015-10-19 21:12:53 +02:00
|
|
|
typedef struct {
|
|
|
|
UINTN Lock;
|
|
|
|
VOID *StackStart;
|
|
|
|
UINTN StackSize;
|
|
|
|
VOID *ApFunction;
|
|
|
|
IA32_DESCRIPTOR GdtrProfile;
|
|
|
|
IA32_DESCRIPTOR IdtrProfile;
|
|
|
|
UINT32 BufferStart;
|
|
|
|
UINT32 Cr3;
|
2018-01-11 10:05:15 +01:00
|
|
|
UINTN InitializeFloatingPointUnitsAddress;
|
2015-10-19 21:12:53 +02:00
|
|
|
} MP_CPU_EXCHANGE_INFO;
|
2018-01-11 10:05:15 +01:00
|
|
|
#pragma pack()
|
2015-10-19 21:12:53 +02:00
|
|
|
|
|
|
|
typedef struct {
|
|
|
|
UINT8 *RendezvousFunnelAddress;
|
|
|
|
UINTN PModeEntryOffset;
|
|
|
|
UINTN FlatJumpOffset;
|
|
|
|
UINTN Size;
|
|
|
|
UINTN LModeEntryOffset;
|
|
|
|
UINTN LongJumpOffset;
|
|
|
|
} MP_ASSEMBLY_ADDRESS_MAP;
|
|
|
|
|
2016-06-29 03:00:13 +02:00
|
|
|
//
|
2018-10-15 04:34:59 +02:00
|
|
|
// Flags used when program the register.
|
2016-06-29 03:00:13 +02:00
|
|
|
//
|
2018-10-15 04:34:59 +02:00
|
|
|
typedef struct {
|
UefiCpuPkg/PiSmmCpuDxeSmm: Separate semaphore container.
In current implementation, core and package level sync uses same semaphores.
Sharing the semaphore may cause wrong execution order.
For example:
1. Feature A has CPU_FEATURE_CORE_BEFORE dependency with Feature B.
2. Feature C has CPU_FEATURE_PACKAGE_AFTER dependency with Feature B.
The expected feature initialization order is A B C:
A ---- (Core Depends) ----> B ---- (Package Depends) ----> C
For a CPU has 1 package, 2 cores and 4 threads. The feature initialization
order may like below:
Thread#1 Thread#2 Thread#3 Thread#4
[A.Init] [A.Init] [A.Init]
Release(S1, S2) Release(S1, S2) Release(S3, S4)
Wait(S1) * 2 Wait(S2) * 2 <------------------------------- Core sync
[B.Init] [B.Init]
Release (S1,S2,S3,S4)
Wait (S1) * 4 <----------------------------------------------------- Package sync
Wait(S4 * 2) <- Core sync
[B.Init]
In above case, for thread#4, when it syncs in core level, Wait(S4) * 2 isn't
blocked and [B.Init] runs. But [A.Init] hasn't run in thread#3. It's wrong!
Thread#4 should execute [B.Init] after thread#3 executes [A.Init] because B
core level depends on A.
The reason of the wrong execution order is that S4 is released in thread#1
by calling Release (S1, S2, S3, S4) and in thread #4 by calling
Release (S3, S4).
To fix this issue, core level sync and package level sync should use separate
semaphores.
In above example, the S4 released in Release (S1, S2, S3, S4) should not be the
same semaphore as that in Release (S3, S4).
Related BZ: https://bugzilla.tianocore.org/show_bug.cgi?id=1311
Cc: Laszlo Ersek <lersek@redhat.com>
Cc: Ruiyu Ni <ruiyu.ni@intel.com>
Contributed-under: TianoCore Contribution Agreement 1.1
Signed-off-by: Eric Dong <eric.dong@intel.com>
Reviewed-by: Ruiyu Ni <ruiyu.ni@intel.com>
Acked-by: Laszlo Ersek <lersek@redhat.com>
2018-11-10 03:53:41 +01:00
|
|
|
volatile UINTN MemoryMappedLock; // Spinlock used to program mmio
|
|
|
|
volatile UINT32 *CoreSemaphoreCount; // Semaphore container used to program
|
|
|
|
// core level semaphore.
|
|
|
|
volatile UINT32 *PackageSemaphoreCount; // Semaphore container used to program
|
|
|
|
// package level semaphore.
|
2018-10-15 04:34:59 +02:00
|
|
|
} PROGRAM_CPU_REGISTER_FLAGS;
|
2016-06-29 03:00:13 +02:00
|
|
|
|
2017-09-28 10:57:35 +02:00
|
|
|
//
|
|
|
|
// Signal that SMM BASE relocation is complete.
|
|
|
|
//
|
|
|
|
volatile BOOLEAN mInitApsAfterSmmBaseReloc;
|
|
|
|
|
2015-10-19 21:12:53 +02:00
|
|
|
/**
|
|
|
|
Get starting address and size of the rendezvous entry for APs.
|
|
|
|
Information for fixing a jump instruction in the code is also returned.
|
|
|
|
|
|
|
|
@param AddressMap Output buffer for address map information.
|
|
|
|
**/
|
|
|
|
VOID *
|
|
|
|
EFIAPI
|
|
|
|
AsmGetAddressMap (
|
|
|
|
MP_ASSEMBLY_ADDRESS_MAP *AddressMap
|
|
|
|
);
|
|
|
|
|
|
|
|
#define LEGACY_REGION_SIZE (2 * 0x1000)
|
|
|
|
#define LEGACY_REGION_BASE (0xA0000 - LEGACY_REGION_SIZE)
|
|
|
|
|
2018-10-15 04:34:59 +02:00
|
|
|
PROGRAM_CPU_REGISTER_FLAGS mCpuFlags;
|
2015-10-19 21:12:53 +02:00
|
|
|
ACPI_CPU_DATA mAcpiCpuData;
|
2016-11-17 21:43:04 +01:00
|
|
|
volatile UINT32 mNumberToFinish;
|
2015-10-19 21:12:53 +02:00
|
|
|
MP_CPU_EXCHANGE_INFO *mExchangeInfo;
|
|
|
|
BOOLEAN mRestoreSmmConfigurationInS3 = FALSE;
|
|
|
|
|
2016-07-19 10:44:16 +02:00
|
|
|
//
|
|
|
|
// S3 boot flag
|
|
|
|
//
|
|
|
|
BOOLEAN mSmmS3Flag = FALSE;
|
|
|
|
|
|
|
|
//
|
|
|
|
// Pointer to structure used during S3 Resume
|
|
|
|
//
|
|
|
|
SMM_S3_RESUME_STATE *mSmmS3ResumeState = NULL;
|
|
|
|
|
2016-07-20 04:24:58 +02:00
|
|
|
BOOLEAN mAcpiS3Enable = TRUE;
|
|
|
|
|
2016-11-10 06:40:12 +01:00
|
|
|
//
// Destination buffer for the AP halt loop. InitializeAp() copies the template
// below into it and then transfers the AP there.
//
UINT8  *mApHltLoopCode = NULL;

//
// Machine code of the AP halt loop: atomically decrement the counter whose
// address is passed at [esp+4], then disable interrupts and halt forever.
//
UINT8  mApHltLoopCodeTemplate[] = {
  0x8B, 0x44, 0x24, 0x04,  // mov  eax, dword ptr [esp+4]
  0xF0, 0xFF, 0x08,        // lock dec  dword ptr [eax]
  0xFA,                    // cli
  0xF4,                    // hlt
  0xEB, 0xFC               // jmp $-2
};
|
|
|
|
|
2015-10-19 21:12:53 +02:00
|
|
|
/**
|
|
|
|
Sync up the MTRR values for all processors.
|
|
|
|
|
|
|
|
@param MtrrTable Table holding fixed/variable MTRR values to be loaded.
|
|
|
|
**/
|
|
|
|
VOID
|
|
|
|
EFIAPI
|
|
|
|
LoadMtrrData (
|
|
|
|
EFI_PHYSICAL_ADDRESS MtrrTable
|
|
|
|
)
|
|
|
|
/*++
|
|
|
|
|
|
|
|
Routine Description:
|
|
|
|
|
|
|
|
Sync up the MTRR values for all processors.
|
|
|
|
|
|
|
|
Arguments:
|
|
|
|
|
|
|
|
Returns:
|
|
|
|
None
|
|
|
|
|
|
|
|
--*/
|
|
|
|
{
|
|
|
|
MTRR_SETTINGS *MtrrSettings;
|
|
|
|
|
|
|
|
MtrrSettings = (MTRR_SETTINGS *) (UINTN) MtrrTable;
|
|
|
|
MtrrSetAllMtrrs (MtrrSettings);
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
2018-10-15 04:34:59 +02:00
|
|
|
Increment semaphore by 1.
|
2015-10-19 21:12:53 +02:00
|
|
|
|
2018-10-15 04:34:59 +02:00
|
|
|
@param Sem IN: 32-bit unsigned integer
|
2015-10-19 21:12:53 +02:00
|
|
|
|
2018-10-15 04:34:59 +02:00
|
|
|
**/
|
|
|
|
VOID
|
|
|
|
S3ReleaseSemaphore (
|
|
|
|
IN OUT volatile UINT32 *Sem
|
|
|
|
)
|
|
|
|
{
|
|
|
|
InterlockedIncrement (Sem);
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
Decrement the semaphore by 1 if it is not zero.
|
2015-10-19 21:12:53 +02:00
|
|
|
|
2018-10-15 04:34:59 +02:00
|
|
|
Performs an atomic decrement operation for semaphore.
|
|
|
|
The compare exchange operation must be performed using
|
|
|
|
MP safe mechanisms.
|
|
|
|
|
|
|
|
@param Sem IN: 32-bit unsigned integer
|
|
|
|
|
|
|
|
**/
|
|
|
|
VOID
|
|
|
|
S3WaitForSemaphore (
|
|
|
|
IN OUT volatile UINT32 *Sem
|
|
|
|
)
|
|
|
|
{
|
|
|
|
UINT32 Value;
|
|
|
|
|
|
|
|
do {
|
|
|
|
Value = *Sem;
|
|
|
|
} while (Value == 0 ||
|
|
|
|
InterlockedCompareExchange32 (
|
|
|
|
Sem,
|
|
|
|
Value,
|
|
|
|
Value - 1
|
|
|
|
) != Value);
|
|
|
|
}
|
|
|
|
|
2019-08-16 05:57:26 +02:00
|
|
|
/**
|
|
|
|
Read / write CR value.
|
|
|
|
|
|
|
|
@param[in] CrIndex The CR index which need to read/write.
|
|
|
|
@param[in] Read Read or write. TRUE is read.
|
|
|
|
@param[in,out] CrValue CR value.
|
|
|
|
|
|
|
|
@retval EFI_SUCCESS means read/write success, else return EFI_UNSUPPORTED.
|
|
|
|
**/
|
|
|
|
UINTN
|
|
|
|
ReadWriteCr (
|
|
|
|
IN UINT32 CrIndex,
|
|
|
|
IN BOOLEAN Read,
|
|
|
|
IN OUT UINTN *CrValue
|
|
|
|
)
|
|
|
|
{
|
|
|
|
switch (CrIndex) {
|
|
|
|
case 0:
|
|
|
|
if (Read) {
|
|
|
|
*CrValue = AsmReadCr0 ();
|
|
|
|
} else {
|
|
|
|
AsmWriteCr0 (*CrValue);
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case 2:
|
|
|
|
if (Read) {
|
|
|
|
*CrValue = AsmReadCr2 ();
|
|
|
|
} else {
|
|
|
|
AsmWriteCr2 (*CrValue);
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case 3:
|
|
|
|
if (Read) {
|
|
|
|
*CrValue = AsmReadCr3 ();
|
|
|
|
} else {
|
|
|
|
AsmWriteCr3 (*CrValue);
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case 4:
|
|
|
|
if (Read) {
|
|
|
|
*CrValue = AsmReadCr4 ();
|
|
|
|
} else {
|
|
|
|
AsmWriteCr4 (*CrValue);
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
return EFI_UNSUPPORTED;;
|
|
|
|
}
|
|
|
|
|
|
|
|
return EFI_SUCCESS;
|
|
|
|
}
|
|
|
|
|
2018-10-15 04:34:59 +02:00
|
|
|
/**
|
|
|
|
Initialize the CPU registers from a register table.
|
|
|
|
|
|
|
|
@param[in] RegisterTable The register table for this AP.
|
|
|
|
@param[in] ApLocation AP location info for this ap.
|
|
|
|
@param[in] CpuStatus CPU status info for this CPU.
|
|
|
|
@param[in] CpuFlags Flags data structure used when program the register.
|
|
|
|
|
|
|
|
@note This service could be called by BSP/APs.
|
2015-10-19 21:12:53 +02:00
|
|
|
**/
|
|
|
|
VOID
|
2018-10-15 04:34:59 +02:00
|
|
|
ProgramProcessorRegister (
|
|
|
|
IN CPU_REGISTER_TABLE *RegisterTable,
|
|
|
|
IN EFI_CPU_PHYSICAL_LOCATION *ApLocation,
|
|
|
|
IN CPU_STATUS_INFORMATION *CpuStatus,
|
|
|
|
IN PROGRAM_CPU_REGISTER_FLAGS *CpuFlags
|
2015-10-19 21:12:53 +02:00
|
|
|
)
|
|
|
|
{
|
|
|
|
CPU_REGISTER_TABLE_ENTRY *RegisterTableEntry;
|
|
|
|
UINTN Index;
|
|
|
|
UINTN Value;
|
2018-10-15 04:34:59 +02:00
|
|
|
CPU_REGISTER_TABLE_ENTRY *RegisterTableEntryHead;
|
|
|
|
volatile UINT32 *SemaphorePtr;
|
|
|
|
UINT32 FirstThread;
|
|
|
|
UINT32 PackageThreadsCount;
|
|
|
|
UINT32 CurrentThread;
|
|
|
|
UINTN ProcessorIndex;
|
|
|
|
UINTN ValidThreadCount;
|
|
|
|
UINT32 *ValidCoreCountPerPackage;
|
2019-08-16 05:57:26 +02:00
|
|
|
EFI_STATUS Status;
|
2019-08-16 05:57:27 +02:00
|
|
|
UINT64 CurrentValue;
|
2015-10-19 21:12:53 +02:00
|
|
|
|
|
|
|
//
|
|
|
|
// Traverse Register Table of this logical processor
|
|
|
|
//
|
2018-10-15 04:34:59 +02:00
|
|
|
RegisterTableEntryHead = (CPU_REGISTER_TABLE_ENTRY *) (UINTN) RegisterTable->RegisterTableEntry;
|
|
|
|
|
|
|
|
for (Index = 0; Index < RegisterTable->TableLength; Index++) {
|
|
|
|
|
|
|
|
RegisterTableEntry = &RegisterTableEntryHead[Index];
|
|
|
|
|
2015-10-19 21:12:53 +02:00
|
|
|
//
|
|
|
|
// Check the type of specified register
|
|
|
|
//
|
|
|
|
switch (RegisterTableEntry->RegisterType) {
|
|
|
|
//
|
|
|
|
// The specified register is Control Register
|
|
|
|
//
|
|
|
|
case ControlRegister:
|
2019-08-16 05:57:26 +02:00
|
|
|
Status = ReadWriteCr (RegisterTableEntry->Index, TRUE, &Value);
|
|
|
|
if (EFI_ERROR (Status)) {
|
2015-10-19 21:12:53 +02:00
|
|
|
break;
|
|
|
|
}
|
2019-08-16 05:57:27 +02:00
|
|
|
if (RegisterTableEntry->TestThenWrite) {
|
|
|
|
CurrentValue = BitFieldRead64 (
|
|
|
|
Value,
|
|
|
|
RegisterTableEntry->ValidBitStart,
|
|
|
|
RegisterTableEntry->ValidBitStart + RegisterTableEntry->ValidBitLength - 1
|
|
|
|
);
|
|
|
|
if (CurrentValue == RegisterTableEntry->Value) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
2019-08-16 05:57:26 +02:00
|
|
|
Value = (UINTN) BitFieldWrite64 (
|
|
|
|
Value,
|
|
|
|
RegisterTableEntry->ValidBitStart,
|
|
|
|
RegisterTableEntry->ValidBitStart + RegisterTableEntry->ValidBitLength - 1,
|
|
|
|
RegisterTableEntry->Value
|
|
|
|
);
|
|
|
|
ReadWriteCr (RegisterTableEntry->Index, FALSE, &Value);
|
2015-10-19 21:12:53 +02:00
|
|
|
break;
|
|
|
|
//
|
|
|
|
// The specified register is Model Specific Register
|
|
|
|
//
|
|
|
|
case Msr:
|
2019-08-16 05:57:27 +02:00
|
|
|
if (RegisterTableEntry->TestThenWrite) {
|
|
|
|
Value = (UINTN)AsmReadMsr64 (RegisterTableEntry->Index);
|
|
|
|
if (RegisterTableEntry->ValidBitLength >= 64) {
|
|
|
|
if (Value == RegisterTableEntry->Value) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
CurrentValue = BitFieldRead64 (
|
|
|
|
Value,
|
|
|
|
RegisterTableEntry->ValidBitStart,
|
|
|
|
RegisterTableEntry->ValidBitStart + RegisterTableEntry->ValidBitLength - 1
|
|
|
|
);
|
|
|
|
if (CurrentValue == RegisterTableEntry->Value) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-10-19 21:12:53 +02:00
|
|
|
//
|
|
|
|
// If this function is called to restore register setting after INIT signal,
|
|
|
|
// there is no need to restore MSRs in register table.
|
|
|
|
//
|
|
|
|
if (RegisterTableEntry->ValidBitLength >= 64) {
|
|
|
|
//
|
|
|
|
// If length is not less than 64 bits, then directly write without reading
|
|
|
|
//
|
|
|
|
AsmWriteMsr64 (
|
|
|
|
RegisterTableEntry->Index,
|
|
|
|
RegisterTableEntry->Value
|
|
|
|
);
|
|
|
|
} else {
|
|
|
|
//
|
|
|
|
// Set the bit section according to bit start and length
|
|
|
|
//
|
|
|
|
AsmMsrBitFieldWrite64 (
|
|
|
|
RegisterTableEntry->Index,
|
|
|
|
RegisterTableEntry->ValidBitStart,
|
|
|
|
RegisterTableEntry->ValidBitStart + RegisterTableEntry->ValidBitLength - 1,
|
|
|
|
RegisterTableEntry->Value
|
|
|
|
);
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
//
|
2016-06-29 03:00:13 +02:00
|
|
|
// MemoryMapped operations
|
|
|
|
//
|
|
|
|
case MemoryMapped:
|
2018-10-15 04:34:59 +02:00
|
|
|
AcquireSpinLock (&CpuFlags->MemoryMappedLock);
|
2016-06-29 03:00:13 +02:00
|
|
|
MmioBitFieldWrite32 (
|
2017-03-23 06:19:49 +01:00
|
|
|
(UINTN)(RegisterTableEntry->Index | LShiftU64 (RegisterTableEntry->HighIndex, 32)),
|
2016-06-29 03:00:13 +02:00
|
|
|
RegisterTableEntry->ValidBitStart,
|
|
|
|
RegisterTableEntry->ValidBitStart + RegisterTableEntry->ValidBitLength - 1,
|
|
|
|
(UINT32)RegisterTableEntry->Value
|
|
|
|
);
|
2018-10-15 04:34:59 +02:00
|
|
|
ReleaseSpinLock (&CpuFlags->MemoryMappedLock);
|
2016-06-29 03:00:13 +02:00
|
|
|
break;
|
|
|
|
//
|
2015-10-19 21:12:53 +02:00
|
|
|
// Enable or disable cache
|
|
|
|
//
|
|
|
|
case CacheControl:
|
|
|
|
//
|
|
|
|
// If value of the entry is 0, then disable cache. Otherwise, enable cache.
|
|
|
|
//
|
|
|
|
if (RegisterTableEntry->Value == 0) {
|
|
|
|
AsmDisableCache ();
|
|
|
|
} else {
|
|
|
|
AsmEnableCache ();
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
2018-10-15 04:34:59 +02:00
|
|
|
case Semaphore:
|
|
|
|
// Semaphore works logic like below:
|
|
|
|
//
|
|
|
|
// V(x) = LibReleaseSemaphore (Semaphore[FirstThread + x]);
|
|
|
|
// P(x) = LibWaitForSemaphore (Semaphore[FirstThread + x]);
|
|
|
|
//
|
|
|
|
// All threads (T0...Tn) waits in P() line and continues running
|
|
|
|
// together.
|
|
|
|
//
|
|
|
|
//
|
|
|
|
// T0 T1 ... Tn
|
|
|
|
//
|
|
|
|
// V(0...n) V(0...n) ... V(0...n)
|
|
|
|
// n * P(0) n * P(1) ... n * P(n)
|
|
|
|
//
|
|
|
|
ASSERT (
|
2018-10-25 03:51:29 +02:00
|
|
|
(ApLocation != NULL) &&
|
2018-10-15 04:34:59 +02:00
|
|
|
(CpuStatus->ValidCoreCountPerPackage != 0) &&
|
UefiCpuPkg/PiSmmCpuDxeSmm: Separate semaphore container.
In current implementation, core and package level sync uses same semaphores.
Sharing the semaphore may cause wrong execution order.
For example:
1. Feature A has CPU_FEATURE_CORE_BEFORE dependency with Feature B.
2. Feature C has CPU_FEATURE_PACKAGE_AFTER dependency with Feature B.
The expected feature initialization order is A B C:
A ---- (Core Depends) ----> B ---- (Package Depends) ----> C
For a CPU has 1 package, 2 cores and 4 threads. The feature initialization
order may like below:
Thread#1 Thread#2 Thread#3 Thread#4
[A.Init] [A.Init] [A.Init]
Release(S1, S2) Release(S1, S2) Release(S3, S4)
Wait(S1) * 2 Wait(S2) * 2 <------------------------------- Core sync
[B.Init] [B.Init]
Release (S1,S2,S3,S4)
Wait (S1) * 4 <----------------------------------------------------- Package sync
Wait(S4 * 2) <- Core sync
[B.Init]
In above case, for thread#4, when it syncs in core level, Wait(S4) * 2 isn't
blocked and [B.Init] runs. But [A.Init] hasn't run in thread#3. It's wrong!
Thread#4 should execute [B.Init] after thread#3 executes [A.Init] because B
core level depends on A.
The reason of the wrong execution order is that S4 is released in thread#1
by calling Release (S1, S2, S3, S4) and in thread #4 by calling
Release (S3, S4).
To fix this issue, core level sync and package level sync should use separate
semaphores.
In above example, the S4 released in Release (S1, S2, S3, S4) should not be the
same semaphore as that in Release (S3, S4).
Related BZ: https://bugzilla.tianocore.org/show_bug.cgi?id=1311
Cc: Laszlo Ersek <lersek@redhat.com>
Cc: Ruiyu Ni <ruiyu.ni@intel.com>
Contributed-under: TianoCore Contribution Agreement 1.1
Signed-off-by: Eric Dong <eric.dong@intel.com>
Reviewed-by: Ruiyu Ni <ruiyu.ni@intel.com>
Acked-by: Laszlo Ersek <lersek@redhat.com>
2018-11-10 03:53:41 +01:00
|
|
|
(CpuFlags->CoreSemaphoreCount != NULL) &&
|
|
|
|
(CpuFlags->PackageSemaphoreCount != NULL)
|
2018-10-15 04:34:59 +02:00
|
|
|
);
|
|
|
|
switch (RegisterTableEntry->Value) {
|
|
|
|
case CoreDepType:
|
UefiCpuPkg/PiSmmCpuDxeSmm: Separate semaphore container.
In current implementation, core and package level sync uses same semaphores.
Sharing the semaphore may cause wrong execution order.
For example:
1. Feature A has CPU_FEATURE_CORE_BEFORE dependency with Feature B.
2. Feature C has CPU_FEATURE_PACKAGE_AFTER dependency with Feature B.
The expected feature initialization order is A B C:
A ---- (Core Depends) ----> B ---- (Package Depends) ----> C
For a CPU has 1 package, 2 cores and 4 threads. The feature initialization
order may like below:
Thread#1 Thread#2 Thread#3 Thread#4
[A.Init] [A.Init] [A.Init]
Release(S1, S2) Release(S1, S2) Release(S3, S4)
Wait(S1) * 2 Wait(S2) * 2 <------------------------------- Core sync
[B.Init] [B.Init]
Release (S1,S2,S3,S4)
Wait (S1) * 4 <----------------------------------------------------- Package sync
Wait(S4 * 2) <- Core sync
[B.Init]
In above case, for thread#4, when it syncs in core level, Wait(S4) * 2 isn't
blocked and [B.Init] runs. But [A.Init] hasn't run in thread#3. It's wrong!
Thread#4 should execute [B.Init] after thread#3 executes [A.Init] because B
core level depends on A.
The reason of the wrong execution order is that S4 is released in thread#1
by calling Release (S1, S2, S3, S4) and in thread #4 by calling
Release (S3, S4).
To fix this issue, core level sync and package level sync should use separate
semaphores.
In above example, the S4 released in Release (S1, S2, S3, S4) should not be the
same semaphore as that in Release (S3, S4).
Related BZ: https://bugzilla.tianocore.org/show_bug.cgi?id=1311
Cc: Laszlo Ersek <lersek@redhat.com>
Cc: Ruiyu Ni <ruiyu.ni@intel.com>
Contributed-under: TianoCore Contribution Agreement 1.1
Signed-off-by: Eric Dong <eric.dong@intel.com>
Reviewed-by: Ruiyu Ni <ruiyu.ni@intel.com>
Acked-by: Laszlo Ersek <lersek@redhat.com>
2018-11-10 03:53:41 +01:00
|
|
|
SemaphorePtr = CpuFlags->CoreSemaphoreCount;
|
2018-10-15 04:34:59 +02:00
|
|
|
//
|
|
|
|
// Get Offset info for the first thread in the core which current thread belongs to.
|
|
|
|
//
|
|
|
|
FirstThread = (ApLocation->Package * CpuStatus->MaxCoreCount + ApLocation->Core) * CpuStatus->MaxThreadCount;
|
|
|
|
CurrentThread = FirstThread + ApLocation->Thread;
|
|
|
|
//
|
|
|
|
// First Notify all threads in current Core that this thread has ready.
|
|
|
|
//
|
|
|
|
for (ProcessorIndex = 0; ProcessorIndex < CpuStatus->MaxThreadCount; ProcessorIndex ++) {
|
|
|
|
S3ReleaseSemaphore (&SemaphorePtr[FirstThread + ProcessorIndex]);
|
|
|
|
}
|
|
|
|
//
|
|
|
|
// Second, check whether all valid threads in current core have ready.
|
|
|
|
//
|
|
|
|
for (ProcessorIndex = 0; ProcessorIndex < CpuStatus->MaxThreadCount; ProcessorIndex ++) {
|
|
|
|
S3WaitForSemaphore (&SemaphorePtr[CurrentThread]);
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
|
|
|
case PackageDepType:
|
UefiCpuPkg/PiSmmCpuDxeSmm: Separate semaphore container.
In current implementation, core and package level sync uses same semaphores.
Sharing the semaphore may cause wrong execution order.
For example:
1. Feature A has CPU_FEATURE_CORE_BEFORE dependency with Feature B.
2. Feature C has CPU_FEATURE_PACKAGE_AFTER dependency with Feature B.
The expected feature initialization order is A B C:
A ---- (Core Depends) ----> B ---- (Package Depends) ----> C
For a CPU has 1 package, 2 cores and 4 threads. The feature initialization
order may like below:
Thread#1 Thread#2 Thread#3 Thread#4
[A.Init] [A.Init] [A.Init]
Release(S1, S2) Release(S1, S2) Release(S3, S4)
Wait(S1) * 2 Wait(S2) * 2 <------------------------------- Core sync
[B.Init] [B.Init]
Release (S1,S2,S3,S4)
Wait (S1) * 4 <----------------------------------------------------- Package sync
Wait(S4 * 2) <- Core sync
[B.Init]
In above case, for thread#4, when it syncs in core level, Wait(S4) * 2 isn't
blocked and [B.Init] runs. But [A.Init] hasn't run in thread#3. It's wrong!
Thread#4 should execute [B.Init] after thread#3 executes [A.Init] because B
core level depends on A.
The reason of the wrong execution order is that S4 is released in thread#1
by calling Release (S1, S2, S3, S4) and in thread #4 by calling
Release (S3, S4).
To fix this issue, core level sync and package level sync should use separate
semaphores.
In above example, the S4 released in Release (S1, S2, S3, S4) should not be the
same semaphore as that in Release (S3, S4).
Related BZ: https://bugzilla.tianocore.org/show_bug.cgi?id=1311
Cc: Laszlo Ersek <lersek@redhat.com>
Cc: Ruiyu Ni <ruiyu.ni@intel.com>
Contributed-under: TianoCore Contribution Agreement 1.1
Signed-off-by: Eric Dong <eric.dong@intel.com>
Reviewed-by: Ruiyu Ni <ruiyu.ni@intel.com>
Acked-by: Laszlo Ersek <lersek@redhat.com>
2018-11-10 03:53:41 +01:00
|
|
|
SemaphorePtr = CpuFlags->PackageSemaphoreCount;
|
2018-10-15 04:34:59 +02:00
|
|
|
ValidCoreCountPerPackage = (UINT32 *)(UINTN)CpuStatus->ValidCoreCountPerPackage;
|
|
|
|
//
|
|
|
|
// Get Offset info for the first thread in the package which current thread belongs to.
|
|
|
|
//
|
|
|
|
FirstThread = ApLocation->Package * CpuStatus->MaxCoreCount * CpuStatus->MaxThreadCount;
|
|
|
|
//
|
|
|
|
// Get the possible threads count for current package.
|
|
|
|
//
|
|
|
|
PackageThreadsCount = CpuStatus->MaxThreadCount * CpuStatus->MaxCoreCount;
|
|
|
|
CurrentThread = FirstThread + CpuStatus->MaxThreadCount * ApLocation->Core + ApLocation->Thread;
|
|
|
|
//
|
|
|
|
// Get the valid thread count for current package.
|
|
|
|
//
|
|
|
|
ValidThreadCount = CpuStatus->MaxThreadCount * ValidCoreCountPerPackage[ApLocation->Package];
|
|
|
|
|
|
|
|
//
|
|
|
|
// Different packages may have different valid cores in them. If driver maintail clearly
|
|
|
|
// cores number in different packages, the logic will be much complicated.
|
|
|
|
// Here driver just simply records the max core number in all packages and use it as expect
|
|
|
|
// core number for all packages.
|
|
|
|
// In below two steps logic, first current thread will Release semaphore for each thread
|
|
|
|
// in current package. Maybe some threads are not valid in this package, but driver don't
|
|
|
|
// care. Second, driver will let current thread wait semaphore for all valid threads in
|
|
|
|
// current package. Because only the valid threads will do release semaphore for this
|
|
|
|
// thread, driver here only need to wait the valid thread count.
|
|
|
|
//
|
|
|
|
|
|
|
|
//
|
|
|
|
// First Notify all threads in current package that this thread has ready.
|
|
|
|
//
|
|
|
|
for (ProcessorIndex = 0; ProcessorIndex < PackageThreadsCount ; ProcessorIndex ++) {
|
|
|
|
S3ReleaseSemaphore (&SemaphorePtr[FirstThread + ProcessorIndex]);
|
|
|
|
}
|
|
|
|
//
|
|
|
|
// Second, check whether all valid threads in current package have ready.
|
|
|
|
//
|
|
|
|
for (ProcessorIndex = 0; ProcessorIndex < ValidThreadCount; ProcessorIndex ++) {
|
|
|
|
S3WaitForSemaphore (&SemaphorePtr[CurrentThread]);
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
2015-10-19 21:12:53 +02:00
|
|
|
default:
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-10-15 04:34:59 +02:00
|
|
|
/**
|
|
|
|
|
|
|
|
Set Processor register for one AP.
|
2018-10-25 03:51:29 +02:00
|
|
|
|
2018-10-15 04:34:59 +02:00
|
|
|
@param PreSmmRegisterTable Use pre Smm register table or register table.
|
|
|
|
|
|
|
|
**/
|
|
|
|
VOID
|
|
|
|
SetRegister (
|
|
|
|
IN BOOLEAN PreSmmRegisterTable
|
|
|
|
)
|
|
|
|
{
|
|
|
|
CPU_REGISTER_TABLE *RegisterTable;
|
|
|
|
CPU_REGISTER_TABLE *RegisterTables;
|
|
|
|
UINT32 InitApicId;
|
|
|
|
UINTN ProcIndex;
|
|
|
|
UINTN Index;
|
|
|
|
|
|
|
|
if (PreSmmRegisterTable) {
|
|
|
|
RegisterTables = (CPU_REGISTER_TABLE *)(UINTN)mAcpiCpuData.PreSmmInitRegisterTable;
|
|
|
|
} else {
|
|
|
|
RegisterTables = (CPU_REGISTER_TABLE *)(UINTN)mAcpiCpuData.RegisterTable;
|
|
|
|
}
|
|
|
|
|
|
|
|
InitApicId = GetInitialApicId ();
|
|
|
|
RegisterTable = NULL;
|
2018-10-25 04:12:52 +02:00
|
|
|
ProcIndex = (UINTN)-1;
|
2018-10-15 04:34:59 +02:00
|
|
|
for (Index = 0; Index < mAcpiCpuData.NumberOfCpus; Index++) {
|
|
|
|
if (RegisterTables[Index].InitialApicId == InitApicId) {
|
|
|
|
RegisterTable = &RegisterTables[Index];
|
|
|
|
ProcIndex = Index;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
ASSERT (RegisterTable != NULL);
|
|
|
|
|
|
|
|
if (mAcpiCpuData.ApLocation != 0) {
|
|
|
|
ProgramProcessorRegister (
|
|
|
|
RegisterTable,
|
|
|
|
(EFI_CPU_PHYSICAL_LOCATION *)(UINTN)mAcpiCpuData.ApLocation + ProcIndex,
|
|
|
|
&mAcpiCpuData.CpuStatus,
|
|
|
|
&mCpuFlags
|
|
|
|
);
|
|
|
|
} else {
|
|
|
|
ProgramProcessorRegister (
|
|
|
|
RegisterTable,
|
|
|
|
NULL,
|
|
|
|
&mAcpiCpuData.CpuStatus,
|
|
|
|
&mCpuFlags
|
|
|
|
);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-10-19 21:12:53 +02:00
|
|
|
/**
|
2017-09-28 10:57:35 +02:00
|
|
|
AP initialization before then after SMBASE relocation in the S3 boot path.
|
2015-10-19 21:12:53 +02:00
|
|
|
**/
|
|
|
|
VOID
|
2017-09-28 11:12:38 +02:00
|
|
|
InitializeAp (
|
2015-10-19 21:12:53 +02:00
|
|
|
VOID
|
|
|
|
)
|
|
|
|
{
|
2017-09-28 10:57:35 +02:00
|
|
|
UINTN TopOfStack;
|
|
|
|
UINT8 Stack[128];
|
2015-10-19 21:12:53 +02:00
|
|
|
|
|
|
|
LoadMtrrData (mAcpiCpuData.MtrrTable);
|
|
|
|
|
2018-10-15 04:34:59 +02:00
|
|
|
SetRegister (TRUE);
|
2017-09-28 10:57:35 +02:00
|
|
|
|
2015-10-19 21:12:53 +02:00
|
|
|
//
|
|
|
|
// Count down the number with lock mechanism.
|
|
|
|
//
|
|
|
|
InterlockedDecrement (&mNumberToFinish);
|
|
|
|
|
2017-09-28 10:57:35 +02:00
|
|
|
//
|
|
|
|
// Wait for BSP to signal SMM Base relocation done.
|
|
|
|
//
|
|
|
|
while (!mInitApsAfterSmmBaseReloc) {
|
|
|
|
CpuPause ();
|
|
|
|
}
|
2015-10-19 21:12:53 +02:00
|
|
|
|
|
|
|
ProgramVirtualWireMode ();
|
|
|
|
DisableLvtInterrupts ();
|
|
|
|
|
2018-10-15 04:34:59 +02:00
|
|
|
SetRegister (FALSE);
|
2015-10-19 21:12:53 +02:00
|
|
|
|
|
|
|
//
|
2016-11-11 06:25:51 +01:00
|
|
|
// Place AP into the safe code, count down the number with lock mechanism in the safe code.
|
2016-11-10 06:40:12 +01:00
|
|
|
//
|
2016-11-17 21:41:35 +01:00
|
|
|
TopOfStack = (UINTN) Stack + sizeof (Stack);
|
|
|
|
TopOfStack &= ~(UINTN) (CPU_STACK_ALIGNMENT - 1);
|
2016-11-10 06:40:12 +01:00
|
|
|
CopyMem ((VOID *) (UINTN) mApHltLoopCode, mApHltLoopCodeTemplate, sizeof (mApHltLoopCodeTemplate));
|
2016-11-17 21:41:35 +01:00
|
|
|
TransferApToSafeState ((UINTN)mApHltLoopCode, TopOfStack, (UINTN)&mNumberToFinish);
|
2015-10-19 21:12:53 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
Prepares startup vector for APs.
|
|
|
|
|
|
|
|
This function prepares startup vector for APs.
|
|
|
|
|
|
|
|
@param WorkingBuffer The address of the work buffer.
|
|
|
|
**/
|
|
|
|
VOID
|
|
|
|
PrepareApStartupVector (
|
|
|
|
EFI_PHYSICAL_ADDRESS WorkingBuffer
|
|
|
|
)
|
|
|
|
{
|
|
|
|
EFI_PHYSICAL_ADDRESS StartupVector;
|
|
|
|
MP_ASSEMBLY_ADDRESS_MAP AddressMap;
|
|
|
|
|
|
|
|
//
|
|
|
|
// Get the address map of startup code for AP,
|
|
|
|
// including code size, and offset of long jump instructions to redirect.
|
|
|
|
//
|
|
|
|
ZeroMem (&AddressMap, sizeof (AddressMap));
|
|
|
|
AsmGetAddressMap (&AddressMap);
|
|
|
|
|
|
|
|
StartupVector = WorkingBuffer;
|
|
|
|
|
|
|
|
//
|
|
|
|
// Copy AP startup code to startup vector, and then redirect the long jump
|
|
|
|
// instructions for mode switching.
|
|
|
|
//
|
|
|
|
CopyMem ((VOID *) (UINTN) StartupVector, AddressMap.RendezvousFunnelAddress, AddressMap.Size);
|
|
|
|
*(UINT32 *) (UINTN) (StartupVector + AddressMap.FlatJumpOffset + 3) = (UINT32) (StartupVector + AddressMap.PModeEntryOffset);
|
|
|
|
if (AddressMap.LongJumpOffset != 0) {
|
|
|
|
*(UINT32 *) (UINTN) (StartupVector + AddressMap.LongJumpOffset + 2) = (UINT32) (StartupVector + AddressMap.LModeEntryOffset);
|
|
|
|
}
|
|
|
|
|
|
|
|
//
|
|
|
|
// Get the start address of exchange data between BSP and AP.
|
|
|
|
//
|
|
|
|
mExchangeInfo = (MP_CPU_EXCHANGE_INFO *) (UINTN) (StartupVector + AddressMap.Size);
|
|
|
|
ZeroMem ((VOID *) mExchangeInfo, sizeof (MP_CPU_EXCHANGE_INFO));
|
|
|
|
|
|
|
|
CopyMem ((VOID *) (UINTN) &mExchangeInfo->GdtrProfile, (VOID *) (UINTN) mAcpiCpuData.GdtrProfile, sizeof (IA32_DESCRIPTOR));
|
|
|
|
CopyMem ((VOID *) (UINTN) &mExchangeInfo->IdtrProfile, (VOID *) (UINTN) mAcpiCpuData.IdtrProfile, sizeof (IA32_DESCRIPTOR));
|
|
|
|
|
|
|
|
mExchangeInfo->StackStart = (VOID *) (UINTN) mAcpiCpuData.StackAddress;
|
|
|
|
mExchangeInfo->StackSize = mAcpiCpuData.StackSize;
|
|
|
|
mExchangeInfo->BufferStart = (UINT32) StartupVector;
|
|
|
|
mExchangeInfo->Cr3 = (UINT32) (AsmReadCr3 ());
|
2018-01-11 10:05:15 +01:00
|
|
|
mExchangeInfo->InitializeFloatingPointUnitsAddress = (UINTN)InitializeFloatingPointUnits;
|
2015-10-19 21:12:53 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
The function is invoked before SMBASE relocation in S3 path to restores CPU status.
|
|
|
|
|
|
|
|
The function is invoked before SMBASE relocation in S3 path. It does first time microcode load
|
|
|
|
and restores MTRRs for both BSP and APs.
|
|
|
|
|
|
|
|
**/
|
|
|
|
VOID
|
2017-09-28 11:12:38 +02:00
|
|
|
InitializeCpuBeforeRebase (
|
2015-10-19 21:12:53 +02:00
|
|
|
VOID
|
|
|
|
)
|
|
|
|
{
|
|
|
|
LoadMtrrData (mAcpiCpuData.MtrrTable);
|
|
|
|
|
2018-10-15 04:34:59 +02:00
|
|
|
SetRegister (TRUE);
|
2015-10-19 21:12:53 +02:00
|
|
|
|
|
|
|
ProgramVirtualWireMode ();
|
|
|
|
|
|
|
|
PrepareApStartupVector (mAcpiCpuData.StartupVector);
|
|
|
|
|
|
|
|
mNumberToFinish = mAcpiCpuData.NumberOfCpus - 1;
|
2017-09-28 11:12:38 +02:00
|
|
|
mExchangeInfo->ApFunction = (VOID *) (UINTN) InitializeAp;
|
2017-09-28 10:57:35 +02:00
|
|
|
|
|
|
|
//
|
|
|
|
// Execute code for before SmmBaseReloc. Note: This flag is maintained across S3 boots.
|
|
|
|
//
|
|
|
|
mInitApsAfterSmmBaseReloc = FALSE;
|
2015-10-19 21:12:53 +02:00
|
|
|
|
|
|
|
//
|
|
|
|
// Send INIT IPI - SIPI to all APs
|
|
|
|
//
|
|
|
|
SendInitSipiSipiAllExcludingSelf ((UINT32)mAcpiCpuData.StartupVector);
|
|
|
|
|
|
|
|
while (mNumberToFinish > 0) {
|
|
|
|
CpuPause ();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
The function is invoked after SMBASE relocation in S3 path to restores CPU status.
|
|
|
|
|
|
|
|
The function is invoked after SMBASE relocation in S3 path. It restores configuration according to
|
|
|
|
data saved by normal boot path for both BSP and APs.
|
|
|
|
|
|
|
|
**/
|
|
|
|
VOID
|
2017-09-28 11:12:38 +02:00
|
|
|
InitializeCpuAfterRebase (
|
2015-10-19 21:12:53 +02:00
|
|
|
VOID
|
|
|
|
)
|
|
|
|
{
|
|
|
|
mNumberToFinish = mAcpiCpuData.NumberOfCpus - 1;
|
|
|
|
|
|
|
|
//
|
2018-10-15 04:34:59 +02:00
|
|
|
// Signal that SMM base relocation is complete and to continue initialization for all APs.
|
2015-10-19 21:12:53 +02:00
|
|
|
//
|
2017-09-28 10:57:35 +02:00
|
|
|
mInitApsAfterSmmBaseReloc = TRUE;
|
2015-10-19 21:12:53 +02:00
|
|
|
|
2018-10-15 04:34:59 +02:00
|
|
|
//
|
|
|
|
// Must begin set register after all APs have continue their initialization.
|
|
|
|
// This is a requirement to support semaphore mechanism in register table.
|
|
|
|
// Because if semaphore's dependence type is package type, semaphore will wait
|
|
|
|
// for all Aps in one package finishing their tasks before set next register
|
|
|
|
// for all APs. If the Aps not begin its task during BSP doing its task, the
|
|
|
|
// BSP thread will hang because it is waiting for other Aps in the same
|
|
|
|
// package finishing their task.
|
|
|
|
//
|
|
|
|
SetRegister (FALSE);
|
|
|
|
|
2015-10-19 21:12:53 +02:00
|
|
|
while (mNumberToFinish > 0) {
|
|
|
|
CpuPause ();
|
|
|
|
}
|
|
|
|
}
|
2016-07-19 10:44:16 +02:00
|
|
|
|
|
|
|
/**
|
|
|
|
Restore SMM Configuration in S3 boot path.
|
|
|
|
|
|
|
|
**/
|
|
|
|
VOID
|
|
|
|
RestoreSmmConfigurationInS3 (
|
|
|
|
VOID
|
|
|
|
)
|
|
|
|
{
|
2016-07-20 04:24:58 +02:00
|
|
|
if (!mAcpiS3Enable) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2016-07-19 10:44:16 +02:00
|
|
|
//
|
|
|
|
// Restore SMM Configuration in S3 boot path.
|
|
|
|
//
|
|
|
|
if (mRestoreSmmConfigurationInS3) {
|
|
|
|
//
|
|
|
|
// Need make sure gSmst is correct because below function may use them.
|
|
|
|
//
|
|
|
|
gSmst->SmmStartupThisAp = gSmmCpuPrivate->SmmCoreEntryContext.SmmStartupThisAp;
|
|
|
|
gSmst->CurrentlyExecutingCpu = gSmmCpuPrivate->SmmCoreEntryContext.CurrentlyExecutingCpu;
|
|
|
|
gSmst->NumberOfCpus = gSmmCpuPrivate->SmmCoreEntryContext.NumberOfCpus;
|
|
|
|
gSmst->CpuSaveStateSize = gSmmCpuPrivate->SmmCoreEntryContext.CpuSaveStateSize;
|
|
|
|
gSmst->CpuSaveState = gSmmCpuPrivate->SmmCoreEntryContext.CpuSaveState;
|
|
|
|
|
|
|
|
//
|
|
|
|
// Configure SMM Code Access Check feature if available.
|
|
|
|
//
|
|
|
|
ConfigSmmCodeAccessCheck ();
|
|
|
|
|
|
|
|
SmmCpuFeaturesCompleteSmmReadyToLock ();
|
|
|
|
|
|
|
|
mRestoreSmmConfigurationInS3 = FALSE;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
Perform SMM initialization for all processors in the S3 boot path.
|
|
|
|
|
|
|
|
For a native platform, MP initialization in the S3 boot path is also performed in this function.
|
|
|
|
**/
|
|
|
|
VOID
|
|
|
|
EFIAPI
|
|
|
|
SmmRestoreCpu (
|
|
|
|
VOID
|
|
|
|
)
|
|
|
|
{
|
|
|
|
SMM_S3_RESUME_STATE *SmmS3ResumeState;
|
|
|
|
IA32_DESCRIPTOR Ia32Idtr;
|
|
|
|
IA32_DESCRIPTOR X64Idtr;
|
|
|
|
IA32_IDT_GATE_DESCRIPTOR IdtEntryTable[EXCEPTION_VECTOR_NUMBER];
|
|
|
|
EFI_STATUS Status;
|
|
|
|
|
|
|
|
DEBUG ((EFI_D_INFO, "SmmRestoreCpu()\n"));
|
|
|
|
|
|
|
|
mSmmS3Flag = TRUE;
|
|
|
|
|
|
|
|
//
|
|
|
|
// See if there is enough context to resume PEI Phase
|
|
|
|
//
|
|
|
|
if (mSmmS3ResumeState == NULL) {
|
|
|
|
DEBUG ((EFI_D_ERROR, "No context to return to PEI Phase\n"));
|
|
|
|
CpuDeadLoop ();
|
|
|
|
}
|
|
|
|
|
|
|
|
SmmS3ResumeState = mSmmS3ResumeState;
|
|
|
|
ASSERT (SmmS3ResumeState != NULL);
|
|
|
|
|
|
|
|
if (SmmS3ResumeState->Signature == SMM_S3_RESUME_SMM_64) {
|
|
|
|
//
|
|
|
|
// Save the IA32 IDT Descriptor
|
|
|
|
//
|
|
|
|
AsmReadIdtr ((IA32_DESCRIPTOR *) &Ia32Idtr);
|
|
|
|
|
|
|
|
//
|
|
|
|
// Setup X64 IDT table
|
|
|
|
//
|
|
|
|
ZeroMem (IdtEntryTable, sizeof (IA32_IDT_GATE_DESCRIPTOR) * 32);
|
|
|
|
X64Idtr.Base = (UINTN) IdtEntryTable;
|
|
|
|
X64Idtr.Limit = (UINT16) (sizeof (IA32_IDT_GATE_DESCRIPTOR) * 32 - 1);
|
|
|
|
AsmWriteIdtr ((IA32_DESCRIPTOR *) &X64Idtr);
|
|
|
|
|
|
|
|
//
|
|
|
|
// Setup the default exception handler
|
|
|
|
//
|
|
|
|
Status = InitializeCpuExceptionHandlers (NULL);
|
|
|
|
ASSERT_EFI_ERROR (Status);
|
|
|
|
|
|
|
|
//
|
|
|
|
// Initialize Debug Agent to support source level debug
|
|
|
|
//
|
|
|
|
InitializeDebugAgent (DEBUG_AGENT_INIT_THUNK_PEI_IA32TOX64, (VOID *)&Ia32Idtr, NULL);
|
|
|
|
}
|
|
|
|
|
|
|
|
//
|
|
|
|
// Skip initialization if mAcpiCpuData is not valid
|
|
|
|
//
|
|
|
|
if (mAcpiCpuData.NumberOfCpus > 0) {
|
|
|
|
//
|
|
|
|
// First time microcode load and restore MTRRs
|
|
|
|
//
|
2017-09-28 11:12:38 +02:00
|
|
|
InitializeCpuBeforeRebase ();
|
2016-07-19 10:44:16 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
//
|
|
|
|
// Restore SMBASE for BSP and all APs
|
|
|
|
//
|
|
|
|
SmmRelocateBases ();
|
|
|
|
|
|
|
|
//
|
|
|
|
// Skip initialization if mAcpiCpuData is not valid
|
|
|
|
//
|
|
|
|
if (mAcpiCpuData.NumberOfCpus > 0) {
|
|
|
|
//
|
|
|
|
// Restore MSRs for BSP and all APs
|
|
|
|
//
|
2017-09-28 11:12:38 +02:00
|
|
|
InitializeCpuAfterRebase ();
|
2016-07-19 10:44:16 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
//
|
|
|
|
// Set a flag to restore SMM configuration in S3 path.
|
|
|
|
//
|
|
|
|
mRestoreSmmConfigurationInS3 = TRUE;
|
|
|
|
|
|
|
|
DEBUG (( EFI_D_INFO, "SMM S3 Return CS = %x\n", SmmS3ResumeState->ReturnCs));
|
|
|
|
DEBUG (( EFI_D_INFO, "SMM S3 Return Entry Point = %x\n", SmmS3ResumeState->ReturnEntryPoint));
|
|
|
|
DEBUG (( EFI_D_INFO, "SMM S3 Return Context1 = %x\n", SmmS3ResumeState->ReturnContext1));
|
|
|
|
DEBUG (( EFI_D_INFO, "SMM S3 Return Context2 = %x\n", SmmS3ResumeState->ReturnContext2));
|
|
|
|
DEBUG (( EFI_D_INFO, "SMM S3 Return Stack Pointer = %x\n", SmmS3ResumeState->ReturnStackPointer));
|
|
|
|
|
|
|
|
//
|
|
|
|
// If SMM is in 32-bit mode, then use SwitchStack() to resume PEI Phase
|
|
|
|
//
|
|
|
|
if (SmmS3ResumeState->Signature == SMM_S3_RESUME_SMM_32) {
|
|
|
|
DEBUG ((EFI_D_INFO, "Call SwitchStack() to return to S3 Resume in PEI Phase\n"));
|
|
|
|
|
|
|
|
SwitchStack (
|
|
|
|
(SWITCH_STACK_ENTRY_POINT)(UINTN)SmmS3ResumeState->ReturnEntryPoint,
|
|
|
|
(VOID *)(UINTN)SmmS3ResumeState->ReturnContext1,
|
|
|
|
(VOID *)(UINTN)SmmS3ResumeState->ReturnContext2,
|
|
|
|
(VOID *)(UINTN)SmmS3ResumeState->ReturnStackPointer
|
|
|
|
);
|
|
|
|
}
|
|
|
|
|
|
|
|
//
|
|
|
|
// If SMM is in 64-bit mode, then use AsmDisablePaging64() to resume PEI Phase
|
|
|
|
//
|
|
|
|
if (SmmS3ResumeState->Signature == SMM_S3_RESUME_SMM_64) {
|
|
|
|
DEBUG ((EFI_D_INFO, "Call AsmDisablePaging64() to return to S3 Resume in PEI Phase\n"));
|
|
|
|
//
|
|
|
|
// Disable interrupt of Debug timer, since new IDT table is for IA32 and will not work in long mode.
|
|
|
|
//
|
|
|
|
SaveAndSetDebugTimerInterrupt (FALSE);
|
|
|
|
//
|
|
|
|
// Restore IA32 IDT table
|
|
|
|
//
|
|
|
|
AsmWriteIdtr ((IA32_DESCRIPTOR *) &Ia32Idtr);
|
|
|
|
AsmDisablePaging64 (
|
|
|
|
SmmS3ResumeState->ReturnCs,
|
|
|
|
(UINT32)SmmS3ResumeState->ReturnEntryPoint,
|
|
|
|
(UINT32)SmmS3ResumeState->ReturnContext1,
|
|
|
|
(UINT32)SmmS3ResumeState->ReturnContext2,
|
|
|
|
(UINT32)SmmS3ResumeState->ReturnStackPointer
|
|
|
|
);
|
|
|
|
}
|
|
|
|
|
|
|
|
//
|
|
|
|
// Can not resume PEI Phase
|
|
|
|
//
|
|
|
|
DEBUG ((EFI_D_ERROR, "No context to return to PEI Phase\n"));
|
|
|
|
CpuDeadLoop ();
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
Initialize SMM S3 resume state structure used during S3 Resume.
|
|
|
|
|
|
|
|
@param[in] Cr3 The base address of the page tables to use in SMM.
|
|
|
|
|
|
|
|
**/
|
|
|
|
VOID
|
|
|
|
InitSmmS3ResumeState (
|
|
|
|
IN UINT32 Cr3
|
|
|
|
)
|
|
|
|
{
|
|
|
|
VOID *GuidHob;
|
|
|
|
EFI_SMRAM_DESCRIPTOR *SmramDescriptor;
|
|
|
|
SMM_S3_RESUME_STATE *SmmS3ResumeState;
|
2016-11-10 06:40:12 +01:00
|
|
|
EFI_PHYSICAL_ADDRESS Address;
|
|
|
|
EFI_STATUS Status;
|
2016-07-19 10:44:16 +02:00
|
|
|
|
2016-07-20 04:24:58 +02:00
|
|
|
if (!mAcpiS3Enable) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2016-07-19 10:44:16 +02:00
|
|
|
GuidHob = GetFirstGuidHob (&gEfiAcpiVariableGuid);
|
2018-09-10 05:13:36 +02:00
|
|
|
if (GuidHob == NULL) {
|
|
|
|
DEBUG ((
|
|
|
|
DEBUG_ERROR,
|
|
|
|
"ERROR:%a(): HOB(gEfiAcpiVariableGuid=%g) needed by S3 resume doesn't exist!\n",
|
|
|
|
__FUNCTION__,
|
|
|
|
&gEfiAcpiVariableGuid
|
|
|
|
));
|
|
|
|
CpuDeadLoop ();
|
|
|
|
} else {
|
2016-07-19 10:44:16 +02:00
|
|
|
SmramDescriptor = (EFI_SMRAM_DESCRIPTOR *) GET_GUID_HOB_DATA (GuidHob);
|
|
|
|
|
|
|
|
DEBUG ((EFI_D_INFO, "SMM S3 SMRAM Structure = %x\n", SmramDescriptor));
|
|
|
|
DEBUG ((EFI_D_INFO, "SMM S3 Structure = %x\n", SmramDescriptor->CpuStart));
|
|
|
|
|
|
|
|
SmmS3ResumeState = (SMM_S3_RESUME_STATE *)(UINTN)SmramDescriptor->CpuStart;
|
|
|
|
ZeroMem (SmmS3ResumeState, sizeof (SMM_S3_RESUME_STATE));
|
|
|
|
|
|
|
|
mSmmS3ResumeState = SmmS3ResumeState;
|
|
|
|
SmmS3ResumeState->Smst = (EFI_PHYSICAL_ADDRESS)(UINTN)gSmst;
|
|
|
|
|
|
|
|
SmmS3ResumeState->SmmS3ResumeEntryPoint = (EFI_PHYSICAL_ADDRESS)(UINTN)SmmRestoreCpu;
|
|
|
|
|
|
|
|
SmmS3ResumeState->SmmS3StackSize = SIZE_32KB;
|
|
|
|
SmmS3ResumeState->SmmS3StackBase = (EFI_PHYSICAL_ADDRESS)(UINTN)AllocatePages (EFI_SIZE_TO_PAGES ((UINTN)SmmS3ResumeState->SmmS3StackSize));
|
|
|
|
if (SmmS3ResumeState->SmmS3StackBase == 0) {
|
|
|
|
SmmS3ResumeState->SmmS3StackSize = 0;
|
|
|
|
}
|
|
|
|
|
UefiCpuPkg/PiSmmCpuDxeSmm: patch "gSmmCr0" with PatchInstructionX86()
Like "gSmmCr4" in the previous patch, "gSmmCr0" is not only used for
machine code patching, but also as a means to communicate the initial CR0
value from SmmRelocateBases() to InitSmmS3ResumeState(). In other words,
the last four bytes of the "mov eax, Cr0Value" instruction's binary
representation are utilized as normal data too.
In order to get rid of the DB for "mov eax, Cr0Value", we have to split
both roles, patching and data flow. Introduce the "mSmmCr0" global (SMRAM)
variable for the data flow purpose. Rename the "gSmmCr0" variable to
"gPatchSmmCr0" so that its association with PatchInstructionX86() is clear
from the declaration, change its type to X86_ASSEMBLY_PATCH_LABEL, and
patch it with PatchInstructionX86(), to the value now contained in
"mSmmCr0".
This lets us remove the binary (DB) encoding of "mov eax, Cr0Value" in
"SmmInit.nasm".
Cc: Eric Dong <eric.dong@intel.com>
Cc: Michael D Kinney <michael.d.kinney@intel.com>
Ref: https://bugzilla.tianocore.org/show_bug.cgi?id=866
Contributed-under: TianoCore Contribution Agreement 1.1
Signed-off-by: Laszlo Ersek <lersek@redhat.com>
Reviewed-by: Liming Gao <liming.gao@intel.com>
2018-02-02 02:10:05 +01:00
|
|
|
SmmS3ResumeState->SmmS3Cr0 = mSmmCr0;
|
2016-07-19 10:44:16 +02:00
|
|
|
SmmS3ResumeState->SmmS3Cr3 = Cr3;
|
UefiCpuPkg/PiSmmCpuDxeSmm: patch "gSmmCr4" with PatchInstructionX86()
Unlike "gSmmCr3" in the previous patch, "gSmmCr4" is not only used for
machine code patching, but also as a means to communicate the initial CR4
value from SmmRelocateBases() to InitSmmS3ResumeState(). In other words,
the last four bytes of the "mov eax, Cr4Value" instruction's binary
representation are utilized as normal data too.
In order to get rid of the DB for "mov eax, Cr4Value", we have to split
both roles, patching and data flow. Introduce the "mSmmCr4" global (SMRAM)
variable for the data flow purpose. Rename the "gSmmCr4" variable to
"gPatchSmmCr4" so that its association with PatchInstructionX86() is clear
from the declaration, change its type to X86_ASSEMBLY_PATCH_LABEL, and
patch it with PatchInstructionX86(), to the value now contained in
"mSmmCr4".
This lets us remove the binary (DB) encoding of "mov eax, Cr4Value" in
"SmmInit.nasm".
Cc: Eric Dong <eric.dong@intel.com>
Cc: Michael D Kinney <michael.d.kinney@intel.com>
Ref: https://bugzilla.tianocore.org/show_bug.cgi?id=866
Contributed-under: TianoCore Contribution Agreement 1.1
Signed-off-by: Laszlo Ersek <lersek@redhat.com>
Reviewed-by: Liming Gao <liming.gao@intel.com>
2018-02-02 02:10:05 +01:00
|
|
|
SmmS3ResumeState->SmmS3Cr4 = mSmmCr4;
|
2016-07-19 10:44:16 +02:00
|
|
|
|
|
|
|
if (sizeof (UINTN) == sizeof (UINT64)) {
|
|
|
|
SmmS3ResumeState->Signature = SMM_S3_RESUME_SMM_64;
|
|
|
|
}
|
|
|
|
if (sizeof (UINTN) == sizeof (UINT32)) {
|
|
|
|
SmmS3ResumeState->Signature = SMM_S3_RESUME_SMM_32;
|
|
|
|
}
|
|
|
|
|
2018-09-14 07:40:37 +02:00
|
|
|
//
|
|
|
|
// Patch SmmS3ResumeState->SmmS3Cr3
|
|
|
|
//
|
|
|
|
InitSmmS3Cr3 ();
|
|
|
|
}
|
2016-11-10 06:40:12 +01:00
|
|
|
|
|
|
|
//
|
|
|
|
// Allocate safe memory in ACPI NVS for AP to execute hlt loop in
|
|
|
|
// protected mode on S3 path
|
|
|
|
//
|
|
|
|
Address = BASE_4GB - 1;
|
|
|
|
Status = gBS->AllocatePages (
|
|
|
|
AllocateMaxAddress,
|
|
|
|
EfiACPIMemoryNVS,
|
|
|
|
EFI_SIZE_TO_PAGES (sizeof (mApHltLoopCodeTemplate)),
|
|
|
|
&Address
|
|
|
|
);
|
|
|
|
ASSERT_EFI_ERROR (Status);
|
|
|
|
mApHltLoopCode = (UINT8 *) (UINTN) Address;
|
2016-07-19 10:44:16 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
Copy register table from ACPI NVS memory into SMRAM.
|
|
|
|
|
|
|
|
@param[in] DestinationRegisterTableList Points to destination register table.
|
|
|
|
@param[in] SourceRegisterTableList Points to source register table.
|
|
|
|
@param[in] NumberOfCpus Number of CPUs.
|
|
|
|
|
|
|
|
**/
|
|
|
|
VOID
|
|
|
|
CopyRegisterTable (
|
|
|
|
IN CPU_REGISTER_TABLE *DestinationRegisterTableList,
|
|
|
|
IN CPU_REGISTER_TABLE *SourceRegisterTableList,
|
|
|
|
IN UINT32 NumberOfCpus
|
|
|
|
)
|
|
|
|
{
|
|
|
|
UINTN Index;
|
|
|
|
CPU_REGISTER_TABLE_ENTRY *RegisterTableEntry;
|
|
|
|
|
|
|
|
CopyMem (DestinationRegisterTableList, SourceRegisterTableList, NumberOfCpus * sizeof (CPU_REGISTER_TABLE));
|
|
|
|
for (Index = 0; Index < NumberOfCpus; Index++) {
|
2017-03-07 13:01:51 +01:00
|
|
|
if (DestinationRegisterTableList[Index].AllocatedSize != 0) {
|
|
|
|
RegisterTableEntry = AllocateCopyPool (
|
|
|
|
DestinationRegisterTableList[Index].AllocatedSize,
|
|
|
|
(VOID *)(UINTN)SourceRegisterTableList[Index].RegisterTableEntry
|
|
|
|
);
|
|
|
|
ASSERT (RegisterTableEntry != NULL);
|
|
|
|
DestinationRegisterTableList[Index].RegisterTableEntry = (EFI_PHYSICAL_ADDRESS)(UINTN)RegisterTableEntry;
|
2016-07-19 10:44:16 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
Get ACPI CPU data.
|
|
|
|
|
|
|
|
**/
|
|
|
|
VOID
|
|
|
|
GetAcpiCpuData (
|
|
|
|
VOID
|
|
|
|
)
|
|
|
|
{
|
|
|
|
ACPI_CPU_DATA *AcpiCpuData;
|
|
|
|
IA32_DESCRIPTOR *Gdtr;
|
|
|
|
IA32_DESCRIPTOR *Idtr;
|
2018-08-10 04:27:42 +02:00
|
|
|
VOID *GdtForAp;
|
|
|
|
VOID *IdtForAp;
|
|
|
|
VOID *MachineCheckHandlerForAp;
|
2018-10-15 04:34:59 +02:00
|
|
|
CPU_STATUS_INFORMATION *CpuStatus;
|
2016-07-19 10:44:16 +02:00
|
|
|
|
2016-07-20 04:24:58 +02:00
|
|
|
if (!mAcpiS3Enable) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2016-07-19 10:44:16 +02:00
|
|
|
//
|
|
|
|
// Prevent use of mAcpiCpuData by initialize NumberOfCpus to 0
|
|
|
|
//
|
|
|
|
mAcpiCpuData.NumberOfCpus = 0;
|
|
|
|
|
|
|
|
//
|
|
|
|
// If PcdCpuS3DataAddress was never set, then do not copy CPU S3 Data into SMRAM
|
|
|
|
//
|
|
|
|
AcpiCpuData = (ACPI_CPU_DATA *)(UINTN)PcdGet64 (PcdCpuS3DataAddress);
|
|
|
|
if (AcpiCpuData == 0) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
//
|
|
|
|
// For a native platform, copy the CPU S3 data into SMRAM for use on CPU S3 Resume.
|
|
|
|
//
|
|
|
|
CopyMem (&mAcpiCpuData, AcpiCpuData, sizeof (mAcpiCpuData));
|
|
|
|
|
|
|
|
mAcpiCpuData.MtrrTable = (EFI_PHYSICAL_ADDRESS)(UINTN)AllocatePool (sizeof (MTRR_SETTINGS));
|
|
|
|
ASSERT (mAcpiCpuData.MtrrTable != 0);
|
|
|
|
|
|
|
|
CopyMem ((VOID *)(UINTN)mAcpiCpuData.MtrrTable, (VOID *)(UINTN)AcpiCpuData->MtrrTable, sizeof (MTRR_SETTINGS));
|
|
|
|
|
|
|
|
mAcpiCpuData.GdtrProfile = (EFI_PHYSICAL_ADDRESS)(UINTN)AllocatePool (sizeof (IA32_DESCRIPTOR));
|
|
|
|
ASSERT (mAcpiCpuData.GdtrProfile != 0);
|
|
|
|
|
|
|
|
CopyMem ((VOID *)(UINTN)mAcpiCpuData.GdtrProfile, (VOID *)(UINTN)AcpiCpuData->GdtrProfile, sizeof (IA32_DESCRIPTOR));
|
|
|
|
|
|
|
|
mAcpiCpuData.IdtrProfile = (EFI_PHYSICAL_ADDRESS)(UINTN)AllocatePool (sizeof (IA32_DESCRIPTOR));
|
|
|
|
ASSERT (mAcpiCpuData.IdtrProfile != 0);
|
|
|
|
|
|
|
|
CopyMem ((VOID *)(UINTN)mAcpiCpuData.IdtrProfile, (VOID *)(UINTN)AcpiCpuData->IdtrProfile, sizeof (IA32_DESCRIPTOR));
|
|
|
|
|
|
|
|
mAcpiCpuData.PreSmmInitRegisterTable = (EFI_PHYSICAL_ADDRESS)(UINTN)AllocatePool (mAcpiCpuData.NumberOfCpus * sizeof (CPU_REGISTER_TABLE));
|
|
|
|
ASSERT (mAcpiCpuData.PreSmmInitRegisterTable != 0);
|
|
|
|
|
|
|
|
CopyRegisterTable (
|
|
|
|
(CPU_REGISTER_TABLE *)(UINTN)mAcpiCpuData.PreSmmInitRegisterTable,
|
|
|
|
(CPU_REGISTER_TABLE *)(UINTN)AcpiCpuData->PreSmmInitRegisterTable,
|
|
|
|
mAcpiCpuData.NumberOfCpus
|
|
|
|
);
|
|
|
|
|
|
|
|
mAcpiCpuData.RegisterTable = (EFI_PHYSICAL_ADDRESS)(UINTN)AllocatePool (mAcpiCpuData.NumberOfCpus * sizeof (CPU_REGISTER_TABLE));
|
|
|
|
ASSERT (mAcpiCpuData.RegisterTable != 0);
|
|
|
|
|
|
|
|
CopyRegisterTable (
|
|
|
|
(CPU_REGISTER_TABLE *)(UINTN)mAcpiCpuData.RegisterTable,
|
|
|
|
(CPU_REGISTER_TABLE *)(UINTN)AcpiCpuData->RegisterTable,
|
|
|
|
mAcpiCpuData.NumberOfCpus
|
|
|
|
);
|
|
|
|
|
|
|
|
//
|
|
|
|
// Copy AP's GDT, IDT and Machine Check handler into SMRAM.
|
|
|
|
//
|
|
|
|
Gdtr = (IA32_DESCRIPTOR *)(UINTN)mAcpiCpuData.GdtrProfile;
|
|
|
|
Idtr = (IA32_DESCRIPTOR *)(UINTN)mAcpiCpuData.IdtrProfile;
|
|
|
|
|
2018-08-10 04:27:42 +02:00
|
|
|
GdtForAp = AllocatePool ((Gdtr->Limit + 1) + (Idtr->Limit + 1) + mAcpiCpuData.ApMachineCheckHandlerSize);
|
|
|
|
ASSERT (GdtForAp != NULL);
|
|
|
|
IdtForAp = (VOID *) ((UINTN)GdtForAp + (Gdtr->Limit + 1));
|
|
|
|
MachineCheckHandlerForAp = (VOID *) ((UINTN)IdtForAp + (Idtr->Limit + 1));
|
|
|
|
|
|
|
|
CopyMem (GdtForAp, (VOID *)Gdtr->Base, Gdtr->Limit + 1);
|
|
|
|
CopyMem (IdtForAp, (VOID *)Idtr->Base, Idtr->Limit + 1);
|
|
|
|
CopyMem (MachineCheckHandlerForAp, (VOID *)(UINTN)mAcpiCpuData.ApMachineCheckHandlerBase, mAcpiCpuData.ApMachineCheckHandlerSize);
|
2016-07-19 10:44:16 +02:00
|
|
|
|
2018-08-10 04:27:42 +02:00
|
|
|
Gdtr->Base = (UINTN)GdtForAp;
|
|
|
|
Idtr->Base = (UINTN)IdtForAp;
|
|
|
|
mAcpiCpuData.ApMachineCheckHandlerBase = (EFI_PHYSICAL_ADDRESS)(UINTN)MachineCheckHandlerForAp;
|
2018-10-15 04:34:59 +02:00
|
|
|
|
|
|
|
CpuStatus = &mAcpiCpuData.CpuStatus;
|
|
|
|
CopyMem (CpuStatus, &AcpiCpuData->CpuStatus, sizeof (CPU_STATUS_INFORMATION));
|
|
|
|
if (AcpiCpuData->CpuStatus.ValidCoreCountPerPackage != 0) {
|
|
|
|
CpuStatus->ValidCoreCountPerPackage = (EFI_PHYSICAL_ADDRESS)(UINTN)AllocateCopyPool (
|
|
|
|
sizeof (UINT32) * CpuStatus->PackageCount,
|
|
|
|
(UINT32 *)(UINTN)AcpiCpuData->CpuStatus.ValidCoreCountPerPackage
|
|
|
|
);
|
|
|
|
ASSERT (CpuStatus->ValidCoreCountPerPackage != 0);
|
|
|
|
}
|
|
|
|
if (AcpiCpuData->ApLocation != 0) {
|
|
|
|
mAcpiCpuData.ApLocation = (EFI_PHYSICAL_ADDRESS)(UINTN)AllocateCopyPool (
|
|
|
|
mAcpiCpuData.NumberOfCpus * sizeof (EFI_CPU_PHYSICAL_LOCATION),
|
|
|
|
(EFI_CPU_PHYSICAL_LOCATION *)(UINTN)AcpiCpuData->ApLocation
|
|
|
|
);
|
|
|
|
ASSERT (mAcpiCpuData.ApLocation != 0);
|
|
|
|
}
|
|
|
|
if (CpuStatus->PackageCount != 0) {
|
UefiCpuPkg/PiSmmCpuDxeSmm: Separate semaphore container.
In current implementation, core and package level sync uses same semaphores.
Sharing the semaphore may cause wrong execution order.
For example:
1. Feature A has CPU_FEATURE_CORE_BEFORE dependency with Feature B.
2. Feature C has CPU_FEATURE_PACKAGE_AFTER dependency with Feature B.
The expected feature initialization order is A B C:
A ---- (Core Depends) ----> B ---- (Package Depends) ----> C
For a CPU has 1 package, 2 cores and 4 threads. The feature initialization
order may like below:
Thread#1 Thread#2 Thread#3 Thread#4
[A.Init] [A.Init] [A.Init]
Release(S1, S2) Release(S1, S2) Release(S3, S4)
Wait(S1) * 2 Wait(S2) * 2 <------------------------------- Core sync
[B.Init] [B.Init]
Release (S1,S2,S3,S4)
Wait (S1) * 4 <----------------------------------------------------- Package sync
Wait(S4 * 2) <- Core sync
[B.Init]
In above case, for thread#4, when it syncs in core level, Wait(S4) * 2 isn't
blocked and [B.Init] runs. But [A.Init] hasn't run in thread#3. It's wrong!
Thread#4 should execute [B.Init] after thread#3 executes [A.Init] because B
core level depends on A.
The reason of the wrong execution order is that S4 is released in thread#1
by calling Release (S1, S2, S3, S4) and in thread #4 by calling
Release (S3, S4).
To fix this issue, core level sync and package level sync should use separate
semaphores.
In above example, the S4 released in Release (S1, S2, S3, S4) should not be the
same semaphore as that in Release (S3, S4).
Related BZ: https://bugzilla.tianocore.org/show_bug.cgi?id=1311
Cc: Laszlo Ersek <lersek@redhat.com>
Cc: Ruiyu Ni <ruiyu.ni@intel.com>
Contributed-under: TianoCore Contribution Agreement 1.1
Signed-off-by: Eric Dong <eric.dong@intel.com>
Reviewed-by: Ruiyu Ni <ruiyu.ni@intel.com>
Acked-by: Laszlo Ersek <lersek@redhat.com>
2018-11-10 03:53:41 +01:00
|
|
|
mCpuFlags.CoreSemaphoreCount = AllocateZeroPool (
|
|
|
|
sizeof (UINT32) * CpuStatus->PackageCount *
|
|
|
|
CpuStatus->MaxCoreCount * CpuStatus->MaxThreadCount
|
|
|
|
);
|
|
|
|
ASSERT (mCpuFlags.CoreSemaphoreCount != NULL);
|
|
|
|
mCpuFlags.PackageSemaphoreCount = AllocateZeroPool (
|
|
|
|
sizeof (UINT32) * CpuStatus->PackageCount *
|
|
|
|
CpuStatus->MaxCoreCount * CpuStatus->MaxThreadCount
|
|
|
|
);
|
|
|
|
ASSERT (mCpuFlags.PackageSemaphoreCount != NULL);
|
2018-10-15 04:34:59 +02:00
|
|
|
}
|
|
|
|
InitializeSpinLock((SPIN_LOCK*) &mCpuFlags.MemoryMappedLock);
|
2016-07-19 10:44:16 +02:00
|
|
|
}
|
2016-07-20 04:24:58 +02:00
|
|
|
|
|
|
|
/**
|
|
|
|
Get ACPI S3 enable flag.
|
|
|
|
|
|
|
|
**/
|
|
|
|
VOID
|
|
|
|
GetAcpiS3EnableFlag (
|
|
|
|
VOID
|
|
|
|
)
|
|
|
|
{
|
|
|
|
mAcpiS3Enable = PcdGetBool (PcdAcpiS3Enable);
|
|
|
|
}
|