public inbox for devel@edk2.groups.io
 help / color / mirror / Atom feed
From: "Laszlo Ersek" <lersek@redhat.com>
To: devel@edk2.groups.io, star.zeng@intel.com
Cc: Ray Ni <ray.ni@intel.com>, Eric Dong <eric.dong@intel.com>
Subject: Re: [edk2-devel] [PATCH V2] UefiCpuPkg PiSmmCpuDxeSmm: Reduce SMRAM consumption in CpuS3.c
Date: Wed, 6 Jan 2021 19:46:28 +0100	[thread overview]
Message-ID: <4bfa073a-4ddb-7fd7-a4c3-ef20b3807f50@redhat.com> (raw)
In-Reply-To: <a6aba141-7894-fe5d-2c15-6c77e2137316@redhat.com>

On 01/06/21 18:56, Laszlo Ersek wrote:
> On 01/06/21 07:48, Zeng, Star wrote:
>> This patch makes two refinements to reduce SMRAM consumption in CpuS3.c.
>> 1. Only do CopyRegisterTable() when register table is not empty,
>>   IsRegisterTableEmpty() is created to check whether the register table
>>   is empty or not.
>>
>>   Take empty PreSmmInitRegisterTable as example, about 24K SMRAM consumption
>>   could be reduced when mAcpiCpuData.NumberOfCpus=1024.
>>   sizeof (CPU_REGISTER_TABLE) = 24
>>   mAcpiCpuData.NumberOfCpus = 1024 = 1K
>>   mAcpiCpuData.NumberOfCpus * sizeof (CPU_REGISTER_TABLE) = 24K
>>
>> 2. Only copy table entries buffer instead of whole buffer.
>>   AllocatedSize in SourceRegisterTableList is the whole buffer size.
>>   Actually, only the table entries buffer needs to be copied, and the size
>>   is TableLength * sizeof (CPU_REGISTER_TABLE_ENTRY).
>>
>>   Take AllocatedSize=0x1000=4096, TableLength=100 and NumberOfCpus=1024 as example,
>>   about 1696K SMRAM consumption could be reduced.
>>   sizeof (CPU_REGISTER_TABLE_ENTRY) = 24
>>   TableLength = 100
>>   TableLength * sizeof (CPU_REGISTER_TABLE_ENTRY) = 2400
>>   AllocatedSize = 0x1000 = 4096
>>   AllocatedSize - TableLength * sizeof (CPU_REGISTER_TABLE_ENTRY) = 4096 - 2400 = 1696
>>   NumberOfCpus = 1024 = 1K
>>   NumberOfCpus * (AllocatedSize - TableLength * sizeof (CPU_REGISTER_TABLE_ENTRY)) = 1696K
>>
>> This patch also corrects the CopyRegisterTable() function description.
>>
>> Signed-off-by: Star Zeng <star.zeng@intel.com>
>> Cc: Ray Ni <ray.ni@intel.com>
>> Cc: Eric Dong <eric.dong@intel.com>
>> Cc: Laszlo Ersek <lersek@redhat.com>
>> ---
>>  UefiCpuPkg/PiSmmCpuDxeSmm/CpuS3.c | 71 +++++++++++++++++++++++--------
>>  1 file changed, 54 insertions(+), 17 deletions(-)
>>
>> diff --git a/UefiCpuPkg/PiSmmCpuDxeSmm/CpuS3.c b/UefiCpuPkg/PiSmmCpuDxeSmm/CpuS3.c
>> index 9592430636ec..9b1f952c8a74 100644
>> --- a/UefiCpuPkg/PiSmmCpuDxeSmm/CpuS3.c
>> +++ b/UefiCpuPkg/PiSmmCpuDxeSmm/CpuS3.c
>> @@ -1,7 +1,7 @@
>>  /** @file
>>  Code for Processor S3 restoration
>>  
>> -Copyright (c) 2006 - 2020, Intel Corporation. All rights reserved.<BR>
>> +Copyright (c) 2006 - 2021, Intel Corporation. All rights reserved.<BR>
>>  SPDX-License-Identifier: BSD-2-Clause-Patent
>>  
>>  **/
>> @@ -487,6 +487,9 @@ SetRegister (
>>    } else {
>>      RegisterTables = (CPU_REGISTER_TABLE *)(UINTN)mAcpiCpuData.RegisterTable;
>>    }
>> +  if (RegisterTables == NULL) {
>> +    return;
>> +  }
>>  
>>    InitApicId = GetInitialApicId ();
>>    RegisterTable = NULL;
>> @@ -948,7 +951,7 @@ InitSmmS3ResumeState (
>>  }
>>  
>>  /**
>> -  Copy register table from ACPI NVS memory into SMRAM.
>> +  Copy register table from non-SMRAM into SMRAM.
>>  
>>    @param[in] DestinationRegisterTableList  Points to destination register table.
>>    @param[in] SourceRegisterTableList       Points to source register table.
>> @@ -967,7 +970,8 @@ CopyRegisterTable (
>>  
>>    CopyMem (DestinationRegisterTableList, SourceRegisterTableList, NumberOfCpus * sizeof (CPU_REGISTER_TABLE));
>>    for (Index = 0; Index < NumberOfCpus; Index++) {
>> -    if (DestinationRegisterTableList[Index].AllocatedSize != 0) {
>> +    if (DestinationRegisterTableList[Index].TableLength != 0) {
>> +      DestinationRegisterTableList[Index].AllocatedSize = DestinationRegisterTableList[Index].TableLength * sizeof (CPU_REGISTER_TABLE_ENTRY);
>>        RegisterTableEntry = AllocateCopyPool (
>>          DestinationRegisterTableList[Index].AllocatedSize,
>>          (VOID *)(UINTN)SourceRegisterTableList[Index].RegisterTableEntry
>> @@ -978,6 +982,31 @@ CopyRegisterTable (
>>    }
>>  }
>>  
>> +/**
>> +  Check whether the register table is empty or not.
>> +
>> +  @param[in] RegisterTable  Point to the register table.
>> +
>> +  @retval TRUE              The register table is empty.
>> +  @retval FALSE             The register table is not empty.
>> +**/
>> +BOOLEAN
>> +IsRegisterTableEmpty (
>> +  IN CPU_REGISTER_TABLE     *RegisterTable,
>> +  IN UINT32                 NumberOfCpus
>> +  )
>> +{
>> +  UINTN                     Index;
>> +
>> +  for (Index = 0; Index < NumberOfCpus; Index++) {
>> +    if (RegisterTable[Index].TableLength != 0) {
>> +      return FALSE;
>> +    }
>> +  }
>> +
>> +  return TRUE;
>> +}
>> +
>>  /**
>>    Get ACPI CPU data.
>>  
>> @@ -1032,23 +1061,31 @@ GetAcpiCpuData (
>>  
>>    CopyMem ((VOID *)(UINTN)mAcpiCpuData.IdtrProfile, (VOID *)(UINTN)AcpiCpuData->IdtrProfile, sizeof (IA32_DESCRIPTOR));
>>  
>> -  mAcpiCpuData.PreSmmInitRegisterTable = (EFI_PHYSICAL_ADDRESS)(UINTN)AllocatePool (mAcpiCpuData.NumberOfCpus * sizeof (CPU_REGISTER_TABLE));
>> -  ASSERT (mAcpiCpuData.PreSmmInitRegisterTable != 0);
>> +  if (!IsRegisterTableEmpty ((CPU_REGISTER_TABLE *)(UINTN)AcpiCpuData->PreSmmInitRegisterTable, mAcpiCpuData.NumberOfCpus)) {
>> +    mAcpiCpuData.PreSmmInitRegisterTable = (EFI_PHYSICAL_ADDRESS)(UINTN)AllocatePool (mAcpiCpuData.NumberOfCpus * sizeof (CPU_REGISTER_TABLE));
>> +    ASSERT (mAcpiCpuData.PreSmmInitRegisterTable != 0);
>>  
>> -  CopyRegisterTable (
>> -    (CPU_REGISTER_TABLE *)(UINTN)mAcpiCpuData.PreSmmInitRegisterTable,
>> -    (CPU_REGISTER_TABLE *)(UINTN)AcpiCpuData->PreSmmInitRegisterTable,
>> -    mAcpiCpuData.NumberOfCpus
>> -    );
>> +    CopyRegisterTable (
>> +      (CPU_REGISTER_TABLE *)(UINTN)mAcpiCpuData.PreSmmInitRegisterTable,
>> +      (CPU_REGISTER_TABLE *)(UINTN)AcpiCpuData->PreSmmInitRegisterTable,
>> +      mAcpiCpuData.NumberOfCpus
>> +      );
>> +  } else {
>> +    mAcpiCpuData.PreSmmInitRegisterTable = 0;
>> +  }
>>  
>> -  mAcpiCpuData.RegisterTable = (EFI_PHYSICAL_ADDRESS)(UINTN)AllocatePool (mAcpiCpuData.NumberOfCpus * sizeof (CPU_REGISTER_TABLE));
>> -  ASSERT (mAcpiCpuData.RegisterTable != 0);
>> +  if (!IsRegisterTableEmpty ((CPU_REGISTER_TABLE *)(UINTN)AcpiCpuData->RegisterTable, mAcpiCpuData.NumberOfCpus)) {
>> +    mAcpiCpuData.RegisterTable = (EFI_PHYSICAL_ADDRESS)(UINTN)AllocatePool (mAcpiCpuData.NumberOfCpus * sizeof (CPU_REGISTER_TABLE));
>> +    ASSERT (mAcpiCpuData.RegisterTable != 0);
>>  
>> -  CopyRegisterTable (
>> -    (CPU_REGISTER_TABLE *)(UINTN)mAcpiCpuData.RegisterTable,
>> -    (CPU_REGISTER_TABLE *)(UINTN)AcpiCpuData->RegisterTable,
>> -    mAcpiCpuData.NumberOfCpus
>> -    );
>> +    CopyRegisterTable (
>> +      (CPU_REGISTER_TABLE *)(UINTN)mAcpiCpuData.RegisterTable,
>> +      (CPU_REGISTER_TABLE *)(UINTN)AcpiCpuData->RegisterTable,
>> +      mAcpiCpuData.NumberOfCpus
>> +      );
>> +  } else {
>> +    mAcpiCpuData.RegisterTable = 0;
>> +  }
>>  
>>    //
>>    // Copy AP's GDT, IDT and Machine Check handler into SMRAM.
>>
> 
> This patch is a step in the right direction, but, IMO, it can be improved.
> 
> The IsRegisterTableEmpty() function should also handle the case when the
> "RegisterTable" parameter is NULL. The function should then also return
> TRUE.
> 
> And then, two more patches would be nice:
> 
> 
> (2) The register table allocation in
> "UefiCpuPkg/CpuS3DataDxe/CpuS3Data.c" should be removed.
> 
> Right now, the code there allocates memory just so it can set the
> "TableLength" and "AllocatedSize" fields to zero, for each "InitialApicId".
> 
> It's a waste -- the memory is allocated only for ensuring that
> PiSmmCpuDxeSmm does not program any CPU registers during S3 resume.
> 
> Setting "AcpiCpuData->RegisterTable" and
> "AcpiCpuData->PreSmmInitRegisterTable" should have the same effect.

... sorry, I meant: setting "AcpiCpuData->RegisterTable" and
"AcpiCpuData->PreSmmInitRegisterTable" *TO NULL* should have the same
effect.

Thanks,
Laszlo

> 
> 
> (3) The same simplification should be then mirrored to
> "OvmfPkg/CpuS3DataDxe/CpuS3Data.c".
> 
> I can write the OvmfPkg patch myself, of course, but first I'd like to
> see this use case confirmed / supported.
> 
> This patch looks OK otherwise.
> 
> Thanks!
> Laszlo
> 
> 
> 
> 
> 
> 


  reply	other threads:[~2021-01-06 18:46 UTC|newest]

Thread overview: 8+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2021-01-06  6:48 [PATCH V2] UefiCpuPkg PiSmmCpuDxeSmm: Reduce SMRAM consumption in CpuS3.c Zeng, Star
2021-01-06  9:44 ` Ni, Ray
2021-01-06 17:56 ` [edk2-devel] " Laszlo Ersek
2021-01-06 18:46   ` Laszlo Ersek [this message]
2021-01-07  5:23   ` Ni, Ray
2021-01-07 10:09     ` Laszlo Ersek
2021-01-07 10:47       ` Zeng, Star
2021-01-07 11:00         ` Laszlo Ersek

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-list from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=4bfa073a-4ddb-7fd7-a4c3-ef20b3807f50@redhat.com \
    --to=devel@edk2.groups.io \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox