blob: d8dc3a839cb6553021edea65553314ea07044d78 [file] [log] [blame]
// Bench.cpp
#include "StdAfx.h"
#ifndef _WIN32
#define USE_POSIX_TIME
#define USE_POSIX_TIME2
#endif
#ifdef USE_POSIX_TIME
#include <time.h>
#ifdef USE_POSIX_TIME2
#include <sys/time.h>
#endif
#endif
#ifdef _WIN32
#define USE_ALLOCA
#endif
#ifdef USE_ALLOCA
#ifdef _WIN32
#include <malloc.h>
#else
#include <stdlib.h>
#endif
#endif
#include "../../../../C/7zCrc.h"
#include "../../../../C/Alloc.h"
#include "../../../../C/CpuArch.h"
#if !defined(_7ZIP_ST) || defined(_WIN32)
#include "../../../Windows/System.h"
#endif
#ifndef _7ZIP_ST
#include "../../../Windows/Synchronization.h"
#include "../../../Windows/Thread.h"
#endif
#include "../../../Common/IntToString.h"
#include "../../../Common/StringConvert.h"
#include "../../../Common/StringToInt.h"
#include "../../Common/MethodProps.h"
#include "../../Common/StreamUtils.h"
#include "Bench.h"
using namespace NWindows;
static const UInt64 kComplexInCommands = (UInt64)1 <<
#ifdef UNDER_CE
31;
#else
34;
#endif
static const UInt64 kComplexInSeconds = 4;
static void SetComplexCommands(UInt32 complexInSeconds, UInt64 cpuFreq, UInt64 &complexInCommands)
{
complexInCommands = kComplexInCommands;
const UInt64 kMinFreq = (UInt64)1000000 * 30;
const UInt64 kMaxFreq = (UInt64)1000000 * 20000;
if (cpuFreq < kMinFreq) cpuFreq = kMinFreq;
if (cpuFreq < kMaxFreq)
{
if (complexInSeconds != 0)
complexInCommands = complexInSeconds * cpuFreq;
else
complexInCommands = cpuFreq >> 2;
}
}
static const unsigned kNumHashDictBits = 17;
static const UInt32 kFilterUnpackSize = (48 << 10);
static const unsigned kOldLzmaDictBits = 30;
static const UInt32 kAdditionalSize = (1 << 16);
static const UInt32 kCompressedAdditionalSize = (1 << 10);
static const UInt32 kMaxLzmaPropSize = 5;
class CBaseRandomGenerator
{
UInt32 A1;
UInt32 A2;
public:
CBaseRandomGenerator() { Init(); }
void Init() { A1 = 362436069; A2 = 521288629;}
UInt32 GetRnd()
{
return
((A1 = 36969 * (A1 & 0xffff) + (A1 >> 16)) << 16) +
((A2 = 18000 * (A2 & 0xffff) + (A2 >> 16)) );
}
};
class CBenchBuffer
{
public:
size_t BufferSize;
Byte *Buffer;
CBenchBuffer(): Buffer(0) {}
virtual ~CBenchBuffer() { Free(); }
void Free()
{
::MidFree(Buffer);
Buffer = 0;
}
bool Alloc(size_t bufferSize)
{
if (Buffer != 0 && BufferSize == bufferSize)
return true;
Free();
Buffer = (Byte *)::MidAlloc(bufferSize);
BufferSize = bufferSize;
return (Buffer != 0 || bufferSize == 0);
}
};
class CBenchRandomGenerator: public CBenchBuffer
{
CBaseRandomGenerator *RG;
public:
void Set(CBaseRandomGenerator *rg) { RG = rg; }
UInt32 GetVal(UInt32 &res, unsigned numBits)
{
UInt32 val = res & (((UInt32)1 << numBits) - 1);
res >>= numBits;
return val;
}
UInt32 GetLen(UInt32 &res)
{
UInt32 len = GetVal(res, 2);
return GetVal(res, 1 + len);
}
void GenerateSimpleRandom()
{
for (UInt32 i = 0; i < BufferSize; i++)
Buffer[i] = (Byte)RG->GetRnd();
}
void Generate(unsigned dictBits)
{
UInt32 pos = 0;
UInt32 rep0 = 1;
while (pos < BufferSize)
{
UInt32 res = RG->GetRnd();
res >>= 1;
if (GetVal(res, 1) == 0 || pos < 1024)
Buffer[pos++] = (Byte)(res & 0xFF);
else
{
UInt32 len;
len = 1 + GetLen(res);
if (GetVal(res, 3) != 0)
{
len += GetLen(res);
do
{
UInt32 ppp = GetVal(res, 5) + 6;
res = RG->GetRnd();
if (ppp > dictBits)
continue;
rep0 = /* (1 << ppp) +*/ GetVal(res, ppp);
res = RG->GetRnd();
}
while (rep0 >= pos);
rep0++;
}
for (UInt32 i = 0; i < len && pos < BufferSize; i++, pos++)
Buffer[pos] = Buffer[pos - rep0];
}
}
}
};
class CBenchmarkInStream:
public ISequentialInStream,
public CMyUnknownImp
{
const Byte *Data;
size_t Pos;
size_t Size;
public:
MY_UNKNOWN_IMP
void Init(const Byte *data, size_t size)
{
Data = data;
Size = size;
Pos = 0;
}
STDMETHOD(Read)(void *data, UInt32 size, UInt32 *processedSize);
};
STDMETHODIMP CBenchmarkInStream::Read(void *data, UInt32 size, UInt32 *processedSize)
{
size_t remain = Size - Pos;
UInt32 kMaxBlockSize = (1 << 20);
if (size > kMaxBlockSize)
size = kMaxBlockSize;
if (size > remain)
size = (UInt32)remain;
for (UInt32 i = 0; i < size; i++)
((Byte *)data)[i] = Data[Pos + i];
Pos += size;
if(processedSize != NULL)
*processedSize = size;
return S_OK;
}
class CBenchmarkOutStream:
public ISequentialOutStream,
public CBenchBuffer,
public CMyUnknownImp
{
// bool _overflow;
public:
UInt32 Pos;
bool RealCopy;
bool CalcCrc;
UInt32 Crc;
// CBenchmarkOutStream(): _overflow(false) {}
void Init(bool realCopy, bool calcCrc)
{
Crc = CRC_INIT_VAL;
RealCopy = realCopy;
CalcCrc = calcCrc;
// _overflow = false;
Pos = 0;
}
MY_UNKNOWN_IMP
STDMETHOD(Write)(const void *data, UInt32 size, UInt32 *processedSize);
};
STDMETHODIMP CBenchmarkOutStream::Write(const void *data, UInt32 size, UInt32 *processedSize)
{
size_t curSize = BufferSize - Pos;
if (curSize > size)
curSize = size;
if (RealCopy)
memcpy(Buffer + Pos, data, curSize);
if (CalcCrc)
Crc = CrcUpdate(Crc, data, curSize);
Pos += (UInt32)curSize;
if(processedSize != NULL)
*processedSize = (UInt32)curSize;
if (curSize != size)
{
// _overflow = true;
return E_FAIL;
}
return S_OK;
}
class CCrcOutStream:
public ISequentialOutStream,
public CMyUnknownImp
{
public:
bool CalcCrc;
UInt32 Crc;
MY_UNKNOWN_IMP
CCrcOutStream(): CalcCrc(true) {};
void Init() { Crc = CRC_INIT_VAL; }
STDMETHOD(Write)(const void *data, UInt32 size, UInt32 *processedSize);
};
STDMETHODIMP CCrcOutStream::Write(const void *data, UInt32 size, UInt32 *processedSize)
{
if (CalcCrc)
Crc = CrcUpdate(Crc, data, size);
if (processedSize != NULL)
*processedSize = size;
return S_OK;
}
static UInt64 GetTimeCount()
{
#ifdef USE_POSIX_TIME
#ifdef USE_POSIX_TIME2
timeval v;
if (gettimeofday(&v, 0) == 0)
return (UInt64)(v.tv_sec) * 1000000 + v.tv_usec;
return (UInt64)time(NULL) * 1000000;
#else
return time(NULL);
#endif
#else
/*
LARGE_INTEGER value;
if (::QueryPerformanceCounter(&value))
return value.QuadPart;
*/
return GetTickCount();
#endif
}
static UInt64 GetFreq()
{
#ifdef USE_POSIX_TIME
#ifdef USE_POSIX_TIME2
return 1000000;
#else
return 1;
#endif
#else
/*
LARGE_INTEGER value;
if (::QueryPerformanceFrequency(&value))
return value.QuadPart;
*/
return 1000;
#endif
}
#ifdef USE_POSIX_TIME
struct CUserTime
{
UInt64 Sum;
clock_t Prev;
void Init()
{
Prev = clock();
Sum = 0;
}
UInt64 GetUserTime()
{
clock_t v = clock();
Sum += v - Prev;
Prev = v;
return Sum;
}
};
#else
static inline UInt64 GetTime64(const FILETIME &t) { return ((UInt64)t.dwHighDateTime << 32) | t.dwLowDateTime; }
UInt64 GetWinUserTime()
{
FILETIME creationTime, exitTime, kernelTime, userTime;
if (
#ifdef UNDER_CE
::GetThreadTimes(::GetCurrentThread()
#else
::GetProcessTimes(::GetCurrentProcess()
#endif
, &creationTime, &exitTime, &kernelTime, &userTime) != 0)
return GetTime64(userTime) + GetTime64(kernelTime);
return (UInt64)GetTickCount() * 10000;
}
struct CUserTime
{
UInt64 StartTime;
void Init() { StartTime = GetWinUserTime(); }
UInt64 GetUserTime() { return GetWinUserTime() - StartTime; }
};
#endif
static UInt64 GetUserFreq()
{
#ifdef USE_POSIX_TIME
return CLOCKS_PER_SEC;
#else
return 10000000;
#endif
}
class CBenchProgressStatus
{
#ifndef _7ZIP_ST
NSynchronization::CCriticalSection CS;
#endif
public:
HRESULT Res;
bool EncodeMode;
void SetResult(HRESULT res)
{
#ifndef _7ZIP_ST
NSynchronization::CCriticalSectionLock lock(CS);
#endif
Res = res;
}
HRESULT GetResult()
{
#ifndef _7ZIP_ST
NSynchronization::CCriticalSectionLock lock(CS);
#endif
return Res;
}
};
struct CBenchInfoCalc
{
CBenchInfo BenchInfo;
CUserTime UserTime;
void SetStartTime();
void SetFinishTime(CBenchInfo &dest);
};
void CBenchInfoCalc::SetStartTime()
{
BenchInfo.GlobalFreq = GetFreq();
BenchInfo.UserFreq = GetUserFreq();
BenchInfo.GlobalTime = ::GetTimeCount();
BenchInfo.UserTime = 0;
UserTime.Init();
}
void CBenchInfoCalc::SetFinishTime(CBenchInfo &dest)
{
dest = BenchInfo;
dest.GlobalTime = ::GetTimeCount() - BenchInfo.GlobalTime;
dest.UserTime = UserTime.GetUserTime();
}
class CBenchProgressInfo:
public ICompressProgressInfo,
public CMyUnknownImp,
public CBenchInfoCalc
{
public:
CBenchProgressStatus *Status;
HRESULT Res;
IBenchCallback *Callback;
CBenchProgressInfo(): Callback(0) {}
MY_UNKNOWN_IMP
STDMETHOD(SetRatioInfo)(const UInt64 *inSize, const UInt64 *outSize);
};
STDMETHODIMP CBenchProgressInfo::SetRatioInfo(const UInt64 *inSize, const UInt64 *outSize)
{
HRESULT res = Status->GetResult();
if (res != S_OK)
return res;
if (!Callback)
return res;
CBenchInfo info;
SetFinishTime(info);
if (Status->EncodeMode)
{
info.UnpackSize = BenchInfo.UnpackSize + *inSize;
info.PackSize = BenchInfo.PackSize + *outSize;
res = Callback->SetEncodeResult(info, false);
}
else
{
info.PackSize = BenchInfo.PackSize + *inSize;
info.UnpackSize = BenchInfo.UnpackSize + *outSize;
res = Callback->SetDecodeResult(info, false);
}
if (res != S_OK)
Status->SetResult(res);
return res;
}
static const int kSubBits = 8;
static UInt32 GetLogSize(UInt32 size)
{
for (int i = kSubBits; i < 32; i++)
for (UInt32 j = 0; j < (1 << kSubBits); j++)
if (size <= (((UInt32)1) << i) + (j << (i - kSubBits)))
return (i << kSubBits) + j;
return (32 << kSubBits);
}
static void NormalizeVals(UInt64 &v1, UInt64 &v2)
{
while (v1 > 1000000)
{
v1 >>= 1;
v2 >>= 1;
}
}
UInt64 CBenchInfo::GetUsage() const
{
UInt64 userTime = UserTime;
UInt64 userFreq = UserFreq;
UInt64 globalTime = GlobalTime;
UInt64 globalFreq = GlobalFreq;
NormalizeVals(userTime, userFreq);
NormalizeVals(globalFreq, globalTime);
if (userFreq == 0)
userFreq = 1;
if (globalTime == 0)
globalTime = 1;
return userTime * globalFreq * 1000000 / userFreq / globalTime;
}
UInt64 CBenchInfo::GetRatingPerUsage(UInt64 rating) const
{
UInt64 userTime = UserTime;
UInt64 userFreq = UserFreq;
UInt64 globalTime = GlobalTime;
UInt64 globalFreq = GlobalFreq;
NormalizeVals(userFreq, userTime);
NormalizeVals(globalTime, globalFreq);
if (globalFreq == 0)
globalFreq = 1;
if (userTime == 0)
userTime = 1;
return userFreq * globalTime / globalFreq * rating / userTime;
}
static UInt64 MyMultDiv64(UInt64 value, UInt64 elapsedTime, UInt64 freq)
{
UInt64 elTime = elapsedTime;
NormalizeVals(freq, elTime);
if (elTime == 0)
elTime = 1;
return value * freq / elTime;
}
UInt64 CBenchInfo::GetSpeed(UInt64 numCommands) const
{
return MyMultDiv64(numCommands, GlobalTime, GlobalFreq);
}
struct CBenchProps
{
bool LzmaRatingMode;
UInt32 EncComplex;
UInt32 DecComplexCompr;
UInt32 DecComplexUnc;
CBenchProps(): LzmaRatingMode(false) {}
void SetLzmaCompexity();
UInt64 GeComprCommands(UInt64 unpackSize)
{
return unpackSize * EncComplex;
}
UInt64 GeDecomprCommands(UInt64 packSize, UInt64 unpackSize)
{
return (packSize * DecComplexCompr + unpackSize * DecComplexUnc);
}
UInt64 GetCompressRating(UInt32 dictSize, UInt64 elapsedTime, UInt64 freq, UInt64 size);
UInt64 GetDecompressRating(UInt64 elapsedTime, UInt64 freq, UInt64 outSize, UInt64 inSize, UInt64 numIterations);
};
void CBenchProps::SetLzmaCompexity()
{
EncComplex = 1200;
DecComplexUnc = 4;
DecComplexCompr = 190;
LzmaRatingMode = true;
}
UInt64 CBenchProps::GetCompressRating(UInt32 dictSize, UInt64 elapsedTime, UInt64 freq, UInt64 size)
{
if (dictSize < (1 << kBenchMinDicLogSize))
dictSize = (1 << kBenchMinDicLogSize);
UInt64 encComplex = EncComplex;
if (LzmaRatingMode)
{
UInt64 t = GetLogSize(dictSize) - (kBenchMinDicLogSize << kSubBits);
encComplex = 870 + ((t * t * 5) >> (2 * kSubBits));
}
UInt64 numCommands = (UInt64)size * encComplex;
return MyMultDiv64(numCommands, elapsedTime, freq);
}
UInt64 CBenchProps::GetDecompressRating(UInt64 elapsedTime, UInt64 freq, UInt64 outSize, UInt64 inSize, UInt64 numIterations)
{
UInt64 numCommands = (inSize * DecComplexCompr + outSize * DecComplexUnc) * numIterations;
return MyMultDiv64(numCommands, elapsedTime, freq);
}
UInt64 GetCompressRating(UInt32 dictSize, UInt64 elapsedTime, UInt64 freq, UInt64 size)
{
CBenchProps props;
props.SetLzmaCompexity();
return props.GetCompressRating(dictSize, elapsedTime, freq, size);
}
UInt64 GetDecompressRating(UInt64 elapsedTime, UInt64 freq, UInt64 outSize, UInt64 inSize, UInt64 numIterations)
{
CBenchProps props;
props.SetLzmaCompexity();
return props.GetDecompressRating(elapsedTime, freq, outSize, inSize, numIterations);
}
struct CEncoderInfo;
struct CEncoderInfo
{
#ifndef _7ZIP_ST
NWindows::CThread thread[2];
UInt32 NumDecoderSubThreads;
#endif
CMyComPtr<ICompressCoder> _encoder;
CMyComPtr<ICompressFilter> _encoderFilter;
CBenchProgressInfo *progressInfoSpec[2];
CMyComPtr<ICompressProgressInfo> progressInfo[2];
UInt64 NumIterations;
#ifdef USE_ALLOCA
size_t AllocaSize;
#endif
Byte _key[32];
Byte _iv[16];
Byte _psw[16];
bool CheckCrc_Enc;
bool CheckCrc_Dec;
struct CDecoderInfo
{
CEncoderInfo *Encoder;
UInt32 DecoderIndex;
#ifdef USE_ALLOCA
size_t AllocaSize;
#endif
bool CallbackMode;
};
CDecoderInfo decodersInfo[2];
CMyComPtr<ICompressCoder> _decoders[2];
CMyComPtr<ICompressFilter> _decoderFilter;
HRESULT Results[2];
CBenchmarkOutStream *outStreamSpec;
CMyComPtr<ISequentialOutStream> outStream;
IBenchCallback *callback;
IBenchPrintCallback *printCallback;
UInt32 crc;
UInt32 kBufferSize;
UInt32 compressedSize;
CBenchRandomGenerator rg;
CBenchBuffer rgCopy; // it must be 16-byte aligned !!!
CBenchmarkOutStream *propStreamSpec;
CMyComPtr<ISequentialOutStream> propStream;
// for decode
COneMethodInfo _method;
UInt32 _uncompressedDataSize;
HRESULT Init(
const COneMethodInfo &method,
UInt32 uncompressedDataSize,
unsigned generateDictBits,
CBaseRandomGenerator *rg);
HRESULT Encode();
HRESULT Decode(UInt32 decoderIndex);
CEncoderInfo():
CheckCrc_Enc(true),
CheckCrc_Dec(true),
outStreamSpec(0), callback(0), printCallback(0), propStreamSpec(0) {}
#ifndef _7ZIP_ST
static THREAD_FUNC_DECL EncodeThreadFunction(void *param)
{
HRESULT res;
CEncoderInfo *encoder = (CEncoderInfo *)param;
try
{
#ifdef USE_ALLOCA
alloca(encoder->AllocaSize);
#endif
res = encoder->Encode();
encoder->Results[0] = res;
}
catch(...)
{
res = E_FAIL;
}
if (res != S_OK)
encoder->progressInfoSpec[0]->Status->SetResult(res);
return 0;
}
static THREAD_FUNC_DECL DecodeThreadFunction(void *param)
{
CDecoderInfo *decoder = (CDecoderInfo *)param;
#ifdef USE_ALLOCA
alloca(decoder->AllocaSize);
#endif
CEncoderInfo *encoder = decoder->Encoder;
encoder->Results[decoder->DecoderIndex] = encoder->Decode(decoder->DecoderIndex);
return 0;
}
HRESULT CreateEncoderThread()
{
return thread[0].Create(EncodeThreadFunction, this);
}
HRESULT CreateDecoderThread(int index, bool callbackMode
#ifdef USE_ALLOCA
, size_t allocaSize
#endif
)
{
CDecoderInfo &decoder = decodersInfo[index];
decoder.DecoderIndex = index;
decoder.Encoder = this;
#ifdef USE_ALLOCA
decoder.AllocaSize = allocaSize;
#endif
decoder.CallbackMode = callbackMode;
return thread[index].Create(DecodeThreadFunction, &decoder);
}
#endif
};
static const UInt32 k_LZMA = 0x030101;
HRESULT CEncoderInfo::Init(
const COneMethodInfo &method,
UInt32 uncompressedDataSize,
unsigned generateDictBits,
CBaseRandomGenerator *rgLoc)
{
rg.Set(rgLoc);
kBufferSize = uncompressedDataSize;
UInt32 kCompressedBufferSize =
kBufferSize + kCompressedAdditionalSize;
// (kBufferSize - kBufferSize / 4) + kCompressedAdditionalSize;
if (!rg.Alloc(kBufferSize))
return E_OUTOFMEMORY;
if (generateDictBits == 0)
rg.GenerateSimpleRandom();
else
rg.Generate(generateDictBits);
crc = CrcCalc(rg.Buffer, rg.BufferSize);
if (_encoderFilter)
{
if (!rgCopy.Alloc(rg.BufferSize))
return E_OUTOFMEMORY;
}
outStreamSpec = new CBenchmarkOutStream;
if (!outStreamSpec->Alloc(kCompressedBufferSize))
return E_OUTOFMEMORY;
outStream = outStreamSpec;
propStreamSpec = 0;
if (!propStream)
{
propStreamSpec = new CBenchmarkOutStream;
propStream = propStreamSpec;
}
if (!propStreamSpec->Alloc(kMaxLzmaPropSize))
return E_OUTOFMEMORY;
propStreamSpec->Init(true, false);
CMyComPtr<IUnknown> coder;
if (_encoderFilter)
coder = _encoderFilter;
else
coder = _encoder;
{
CMyComPtr<ICompressSetCoderProperties> scp;
coder.QueryInterface(IID_ICompressSetCoderProperties, &scp);
if (scp)
{
UInt64 reduceSize = uncompressedDataSize;
RINOK(method.SetCoderProps(scp, &reduceSize));
}
else
{
if (method.AreThereNonOptionalProps())
return E_INVALIDARG;
}
CMyComPtr<ICompressWriteCoderProperties> writeCoderProps;
coder.QueryInterface(IID_ICompressWriteCoderProperties, &writeCoderProps);
if (writeCoderProps)
{
RINOK(writeCoderProps->WriteCoderProperties(propStream));
}
{
CMyComPtr<ICryptoSetPassword> sp;
coder.QueryInterface(IID_ICryptoSetPassword, &sp);
if (sp)
{
RINOK(sp->CryptoSetPassword(_psw, sizeof(_psw)));
// we must call encoding one time to calculate password key for key cache.
// it must be after WriteCoderProperties!
CBenchmarkInStream *inStreamSpec = new CBenchmarkInStream;
CMyComPtr<ISequentialInStream> inStream = inStreamSpec;
Byte temp[16];
memset(temp, 0, sizeof(temp));
inStreamSpec->Init(temp, sizeof(temp));
CCrcOutStream *outStreamSpec = new CCrcOutStream;
CMyComPtr<ISequentialOutStream> outStream = outStreamSpec;
outStreamSpec->Init();
if (_encoderFilter)
{
_encoderFilter->Init();
_encoderFilter->Filter(temp, sizeof(temp));
}
else
{
RINOK(_encoder->Code(inStream, outStream, 0, 0, NULL));
}
}
}
}
return S_OK;
}
HRESULT CEncoderInfo::Encode()
{
CBenchInfo &bi = progressInfoSpec[0]->BenchInfo;
bi.UnpackSize = 0;
bi.PackSize = 0;
CMyComPtr<ICryptoProperties> cp;
CMyComPtr<IUnknown> coder;
if (_encoderFilter)
coder = _encoderFilter;
else
coder = _encoder;
coder.QueryInterface(IID_ICryptoProperties, &cp);
CBenchmarkInStream *inStreamSpec = new CBenchmarkInStream;
CMyComPtr<ISequentialInStream> inStream = inStreamSpec;
UInt64 prev = 0;
UInt32 crcPrev = 0;
if (cp)
{
RINOK(cp->SetKey(_key, sizeof(_key)));
RINOK(cp->SetInitVector(_iv, sizeof(_iv)));
}
for (UInt64 i = 0; i < NumIterations; i++)
{
if (printCallback && bi.UnpackSize - prev > (1 << 20))
{
RINOK(printCallback->CheckBreak());
prev = bi.UnpackSize;
}
bool isLast = (i == NumIterations - 1);
bool calcCrc = ((isLast || (i & 0x7F) == 0 || CheckCrc_Enc) && NumIterations != 1);
outStreamSpec->Init(isLast, calcCrc);
if (_encoderFilter)
{
memcpy(rgCopy.Buffer, rg.Buffer, rg.BufferSize);
_encoderFilter->Init();
_encoderFilter->Filter(rgCopy.Buffer, (UInt32)rg.BufferSize);
RINOK(WriteStream(outStream, rgCopy.Buffer, rg.BufferSize));
}
else
{
inStreamSpec->Init(rg.Buffer, rg.BufferSize);
RINOK(_encoder->Code(inStream, outStream, 0, 0, progressInfo[0]));
}
UInt32 crcNew = CRC_GET_DIGEST(outStreamSpec->Crc);
if (i == 0)
crcPrev = crcNew;
else if (calcCrc && crcPrev != crcNew)
return E_FAIL;
compressedSize = outStreamSpec->Pos;
bi.UnpackSize += rg.BufferSize;
bi.PackSize += compressedSize;
}
_encoder.Release();
_encoderFilter.Release();
return S_OK;
}
HRESULT CEncoderInfo::Decode(UInt32 decoderIndex)
{
CBenchmarkInStream *inStreamSpec = new CBenchmarkInStream;
CMyComPtr<ISequentialInStream> inStream = inStreamSpec;
CMyComPtr<ICompressCoder> &decoder = _decoders[decoderIndex];
CMyComPtr<IUnknown> coder;
if (_decoderFilter)
{
if (decoderIndex != 0)
return E_FAIL;
coder = _decoderFilter;
}
else
coder = decoder;
CMyComPtr<ICompressSetDecoderProperties2> setDecProps;
coder.QueryInterface(IID_ICompressSetDecoderProperties2, &setDecProps);
if (!setDecProps && propStreamSpec->Pos != 0)
return E_FAIL;
CCrcOutStream *crcOutStreamSpec = new CCrcOutStream;
CMyComPtr<ISequentialOutStream> crcOutStream = crcOutStreamSpec;
CBenchProgressInfo *pi = progressInfoSpec[decoderIndex];
pi->BenchInfo.UnpackSize = 0;
pi->BenchInfo.PackSize = 0;
#ifndef _7ZIP_ST
{
CMyComPtr<ICompressSetCoderMt> setCoderMt;
coder.QueryInterface(IID_ICompressSetCoderMt, &setCoderMt);
if (setCoderMt)
{
RINOK(setCoderMt->SetNumberOfThreads(NumDecoderSubThreads));
}
}
#endif
CMyComPtr<ICompressSetCoderProperties> scp;
coder.QueryInterface(IID_ICompressSetCoderProperties, &scp);
if (scp)
{
UInt64 reduceSize = _uncompressedDataSize;
RINOK(_method.SetCoderProps(scp, &reduceSize));
}
CMyComPtr<ICryptoProperties> cp;
coder.QueryInterface(IID_ICryptoProperties, &cp);
if (setDecProps)
{
RINOK(setDecProps->SetDecoderProperties2(propStreamSpec->Buffer, propStreamSpec->Pos));
}
{
CMyComPtr<ICryptoSetPassword> sp;
coder.QueryInterface(IID_ICryptoSetPassword, &sp);
if (sp)
{
RINOK(sp->CryptoSetPassword(_psw, sizeof(_psw)));
}
}
UInt64 prev = 0;
if (cp)
{
RINOK(cp->SetKey(_key, sizeof(_key)));
RINOK(cp->SetInitVector(_iv, sizeof(_iv)));
}
for (UInt64 i = 0; i < NumIterations; i++)
{
if (printCallback && pi->BenchInfo.UnpackSize - prev > (1 << 20))
{
RINOK(printCallback->CheckBreak());
prev = pi->BenchInfo.UnpackSize;
}
inStreamSpec->Init(outStreamSpec->Buffer, compressedSize);
crcOutStreamSpec->Init();
UInt64 outSize = kBufferSize;
crcOutStreamSpec->CalcCrc = ((i & 0x7F) == 0 || CheckCrc_Dec);
if (_decoderFilter)
{
if (compressedSize > rgCopy.BufferSize)
return E_FAIL;
memcpy(rgCopy.Buffer, outStreamSpec->Buffer, compressedSize);
_decoderFilter->Init();
_decoderFilter->Filter(rgCopy.Buffer, compressedSize);
RINOK(WriteStream(crcOutStream, rgCopy.Buffer, rg.BufferSize));
}
else
{
RINOK(decoder->Code(inStream, crcOutStream, 0, &outSize, progressInfo[decoderIndex]));
}
if (crcOutStreamSpec->CalcCrc && CRC_GET_DIGEST(crcOutStreamSpec->Crc) != crc)
return S_FALSE;
pi->BenchInfo.UnpackSize += kBufferSize;
pi->BenchInfo.PackSize += compressedSize;
}
decoder.Release();
_decoderFilter.Release();
return S_OK;
}
static const UInt32 kNumThreadsMax = (1 << 12);
struct CBenchEncoders
{
CEncoderInfo *encoders;
CBenchEncoders(UInt32 num): encoders(0) { encoders = new CEncoderInfo[num]; }
~CBenchEncoders() { delete []encoders; }
};
static UInt64 GetNumIterations(UInt64 numCommands, UInt64 complexInCommands)
{
if (numCommands < (1 << 4))
numCommands = (1 << 4);
UInt64 res = complexInCommands / numCommands;
return (res == 0 ? 1 : res);
}
static HRESULT MethodBench(
DECL_EXTERNAL_CODECS_LOC_VARS
UInt64 complexInCommands,
bool oldLzmaBenchMode,
UInt32 numThreads,
const COneMethodInfo &method2,
UInt32 uncompressedDataSize,
unsigned generateDictBits,
IBenchPrintCallback *printCallback,
IBenchCallback *callback,
CBenchProps *benchProps)
{
COneMethodInfo method = method2;
UInt64 methodId;
UInt32 numInStreams, numOutStreams;
if (!FindMethod(
EXTERNAL_CODECS_LOC_VARS
method.MethodName, methodId, numInStreams, numOutStreams))
return E_NOTIMPL;
if (numInStreams != 1 || numOutStreams != 1)
return E_INVALIDARG;
UInt32 numEncoderThreads = 1;
UInt32 numSubDecoderThreads = 1;
#ifndef _7ZIP_ST
numEncoderThreads = numThreads;
if (oldLzmaBenchMode && methodId == k_LZMA)
{
bool fixedNumber;
UInt32 numLzmaThreads = method.Get_Lzma_NumThreads(fixedNumber);
if (!fixedNumber && numThreads == 1)
method.AddNumThreadsProp(1);
if (numThreads > 1 && numLzmaThreads > 1)
{
numEncoderThreads = numThreads / 2;
numSubDecoderThreads = 2;
}
}
#endif
CBenchEncoders encodersSpec(numEncoderThreads);
CEncoderInfo *encoders = encodersSpec.encoders;
UInt32 i;
for (i = 0; i < numEncoderThreads; i++)
{
CEncoderInfo &encoder = encoders[i];
encoder.callback = (i == 0) ? callback : 0;
encoder.printCallback = printCallback;
CMyComPtr<ICompressCoder2> coder2;
RINOK(CreateCoder(EXTERNAL_CODECS_LOC_VARS methodId,
encoder._encoderFilter, encoder._encoder, coder2, true, false));
if (!encoder._encoder && !encoder._encoderFilter)
return E_NOTIMPL;
// encoder._encoderFilter.Release(); // we can disable filter to check the speed of FilterCoder.
encoder.CheckCrc_Enc = (benchProps->EncComplex) > 30 ;
encoder.CheckCrc_Dec = (benchProps->DecComplexCompr + benchProps->DecComplexUnc) > 30 ;
memset(encoder._iv, 0, sizeof(encoder._iv));
memset(encoder._key, 0, sizeof(encoder._key));
memset(encoder._psw, 0, sizeof(encoder._psw));
for (UInt32 j = 0; j < numSubDecoderThreads; j++)
{
CMyComPtr<ICompressCoder2> coder2de;
CMyComPtr<ICompressCoder> &decoder = encoder._decoders[j];
RINOK(CreateCoder(EXTERNAL_CODECS_LOC_VARS methodId,
encoder._decoderFilter, decoder, coder2de, false, false));
if (!encoder._decoderFilter && !decoder)
return E_NOTIMPL;
}
}
CBaseRandomGenerator rg;
rg.Init();
for (i = 0; i < numEncoderThreads; i++)
{
CEncoderInfo &encoder = encoders[i];
encoder._method = method;
encoder._uncompressedDataSize = uncompressedDataSize;
RINOK(encoders[i].Init(method, uncompressedDataSize, generateDictBits, &rg));
}
CBenchProgressStatus status;
status.Res = S_OK;
status.EncodeMode = true;
for (i = 0; i < numEncoderThreads; i++)
{
CEncoderInfo &encoder = encoders[i];
encoder.NumIterations = GetNumIterations(benchProps->GeComprCommands(uncompressedDataSize), complexInCommands);
for (int j = 0; j < 2; j++)
{
CBenchProgressInfo *spec = new CBenchProgressInfo;
encoder.progressInfoSpec[j] = spec;
encoder.progressInfo[j] = spec;
spec->Status = &status;
}
if (i == 0)
{
CBenchProgressInfo *bpi = encoder.progressInfoSpec[0];
bpi->Callback = callback;
bpi->BenchInfo.NumIterations = numEncoderThreads;
bpi->SetStartTime();
}
#ifndef _7ZIP_ST
if (numEncoderThreads > 1)
{
#ifdef USE_ALLOCA
encoder.AllocaSize = (i * 16 * 21) & 0x7FF;
#endif
RINOK(encoder.CreateEncoderThread())
}
else
#endif
{
RINOK(encoder.Encode());
}
}
#ifndef _7ZIP_ST
if (numEncoderThreads > 1)
for (i = 0; i < numEncoderThreads; i++)
encoders[i].thread[0].Wait();
#endif
RINOK(status.Res);
CBenchInfo info;
encoders[0].progressInfoSpec[0]->SetFinishTime(info);
info.UnpackSize = 0;
info.PackSize = 0;
info.NumIterations = encoders[0].NumIterations;
for (i = 0; i < numEncoderThreads; i++)
{
CEncoderInfo &encoder = encoders[i];
info.UnpackSize += encoder.kBufferSize;
info.PackSize += encoder.compressedSize;
}
RINOK(callback->SetEncodeResult(info, true));
status.Res = S_OK;
status.EncodeMode = false;
UInt32 numDecoderThreads = numEncoderThreads * numSubDecoderThreads;
for (i = 0; i < numEncoderThreads; i++)
{
CEncoderInfo &encoder = encoders[i];
if (i == 0)
{
encoder.NumIterations = GetNumIterations(benchProps->GeDecomprCommands(encoder.compressedSize, encoder.kBufferSize), complexInCommands);
CBenchProgressInfo *bpi = encoder.progressInfoSpec[0];
bpi->Callback = callback;
bpi->BenchInfo.NumIterations = numDecoderThreads;
bpi->SetStartTime();
}
else
encoder.NumIterations = encoders[0].NumIterations;
#ifndef _7ZIP_ST
{
int numSubThreads = method.Get_NumThreads();
encoder.NumDecoderSubThreads = (numSubThreads <= 0) ? 1 : numSubThreads;
}
if (numDecoderThreads > 1)
{
for (UInt32 j = 0; j < numSubDecoderThreads; j++)
{
HRESULT res = encoder.CreateDecoderThread(j, (i == 0 && j == 0)
#ifdef USE_ALLOCA
, ((i * numSubDecoderThreads + j) * 16 * 21) & 0x7FF
#endif
);
RINOK(res);
}
}
else
#endif
{
RINOK(encoder.Decode(0));
}
}
#ifndef _7ZIP_ST
HRESULT res = S_OK;
if (numDecoderThreads > 1)
for (i = 0; i < numEncoderThreads; i++)
for (UInt32 j = 0; j < numSubDecoderThreads; j++)
{
CEncoderInfo &encoder = encoders[i];
encoder.thread[j].Wait();
if (encoder.Results[j] != S_OK)
res = encoder.Results[j];
}
RINOK(res);
#endif
RINOK(status.Res);
encoders[0].progressInfoSpec[0]->SetFinishTime(info);
#ifndef _7ZIP_ST
#ifdef UNDER_CE
if (numDecoderThreads > 1)
for (i = 0; i < numEncoderThreads; i++)
for (UInt32 j = 0; j < numSubDecoderThreads; j++)
{
FILETIME creationTime, exitTime, kernelTime, userTime;
if (::GetThreadTimes(encoders[i].thread[j], &creationTime, &exitTime, &kernelTime, &userTime) != 0)
info.UserTime += GetTime64(userTime) + GetTime64(kernelTime);
}
#endif
#endif
info.UnpackSize = 0;
info.PackSize = 0;
info.NumIterations = numSubDecoderThreads * encoders[0].NumIterations;
for (i = 0; i < numEncoderThreads; i++)
{
CEncoderInfo &encoder = encoders[i];
info.UnpackSize += encoder.kBufferSize;
info.PackSize += encoder.compressedSize;
}
RINOK(callback->SetDecodeResult(info, false));
RINOK(callback->SetDecodeResult(info, true));
return S_OK;
}
inline UInt64 GetLZMAUsage(bool multiThread, UInt32 dictionary)
{
UInt32 hs = dictionary - 1;
hs |= (hs >> 1);
hs |= (hs >> 2);
hs |= (hs >> 4);
hs |= (hs >> 8);
hs >>= 1;
hs |= 0xFFFF;
if (hs > (1 << 24))
hs >>= 1;
hs++;
return ((hs + (1 << 16)) + (UInt64)dictionary * 2) * 4 + (UInt64)dictionary * 3 / 2 +
(1 << 20) + (multiThread ? (6 << 20) : 0);
}
UInt64 GetBenchMemoryUsage(UInt32 numThreads, UInt32 dictionary)
{
const UInt32 kBufferSize = dictionary;
const UInt32 kCompressedBufferSize = (kBufferSize / 2);
UInt32 numSubThreads = (numThreads > 1) ? 2 : 1;
UInt32 numBigThreads = numThreads / numSubThreads;
return (kBufferSize + kCompressedBufferSize +
GetLZMAUsage((numThreads > 1), dictionary) + (2 << 20)) * numBigThreads;
}
static HRESULT CrcBig(const void *data, UInt32 size, UInt64 numIterations,
const UInt32 *checkSum, IHasher *hf,
IBenchPrintCallback *callback)
{
Byte hash[64];
UInt64 i;
for (i = 0; i < sizeof(hash); i++)
hash[i] = 0;
for (i = 0; i < numIterations; i++)
{
if (callback && (i & 0xFF) == 0)
{
RINOK(callback->CheckBreak());
}
hf->Init();
hf->Update(data, size);
hf->Final(hash);
UInt32 hashSize = hf->GetDigestSize();
if (hashSize > sizeof(hash))
return S_FALSE;
UInt32 sum = 0;
for (UInt32 j = 0; j < hashSize; j += 4)
sum ^= GetUi32(hash + j);
if (checkSum && sum != *checkSum)
{
// printf(" %08X ", sum);
return S_FALSE;
}
}
return S_OK;
}
UInt32 g_BenchCpuFreqTemp = 1;
#define YY1 sum += val; sum ^= val;
#define YY3 YY1 YY1 YY1 YY1
#define YY5 YY3 YY3 YY3 YY3
#define YY7 YY5 YY5 YY5 YY5
static const UInt32 kNumFreqCommands = 128;
static UInt32 CountCpuFreq(UInt32 sum, UInt32 num, UInt32 val)
{
for (UInt32 i = 0; i < num; i++)
{
YY7
}
return sum;
}
#ifndef _7ZIP_ST
struct CFreqInfo
{
NWindows::CThread Thread;
IBenchPrintCallback *Callback;
HRESULT CallbackRes;
UInt32 ValRes;
UInt32 Size;
UInt64 NumIterations;
void Wait()
{
Thread.Wait();
Thread.Close();
}
};
static THREAD_FUNC_DECL FreqThreadFunction(void *param)
{
CFreqInfo *p = (CFreqInfo *)param;
UInt32 sum = g_BenchCpuFreqTemp;
for (UInt64 k = p->NumIterations; k > 0; k--)
{
p->CallbackRes = p->Callback->CheckBreak();
if (p->CallbackRes != S_OK)
return 0;
sum = CountCpuFreq(sum, p->Size, g_BenchCpuFreqTemp);
}
p->ValRes = sum;
return 0;
}
struct CFreqThreads
{
CFreqInfo *Items;
UInt32 NumThreads;
CFreqThreads(): Items(0), NumThreads(0) {}
void WaitAll()
{
for (UInt32 i = 0; i < NumThreads; i++)
Items[i].Wait();
NumThreads = 0;
}
~CFreqThreads()
{
WaitAll();
delete []Items;
}
};
struct CCrcInfo
{
NWindows::CThread Thread;
IBenchPrintCallback *Callback;
HRESULT CallbackRes;
const Byte *Data;
UInt32 Size;
UInt64 NumIterations;
bool CheckSumDefined;
UInt32 CheckSum;
CMyComPtr<IHasher> Hasher;
HRESULT Res;
void Wait()
{
Thread.Wait();
Thread.Close();
}
};
static THREAD_FUNC_DECL CrcThreadFunction(void *param)
{
CCrcInfo *p = (CCrcInfo *)param;
p->Res = CrcBig(p->Data, p->Size, p->NumIterations,
p->CheckSumDefined ? &p->CheckSum : NULL, p->Hasher,
p->Callback);
return 0;
}
struct CCrcThreads
{
CCrcInfo *Items;
UInt32 NumThreads;
CCrcThreads(): Items(0), NumThreads(0) {}
void WaitAll()
{
for (UInt32 i = 0; i < NumThreads; i++)
Items[i].Wait();
NumThreads = 0;
}
~CCrcThreads()
{
WaitAll();
delete []Items;
}
};
#endif
static UInt32 CrcCalc1(const Byte *buf, UInt32 size)
{
UInt32 crc = CRC_INIT_VAL;;
for (UInt32 i = 0; i < size; i++)
crc = CRC_UPDATE_BYTE(crc, buf[i]);
return CRC_GET_DIGEST(crc);
}
static void RandGen(Byte *buf, UInt32 size, CBaseRandomGenerator &RG)
{
for (UInt32 i = 0; i < size; i++)
buf[i] = (Byte)RG.GetRnd();
}
static UInt32 RandGenCrc(Byte *buf, UInt32 size, CBaseRandomGenerator &RG)
{
RandGen(buf, size, RG);
return CrcCalc1(buf, size);
}
bool CrcInternalTest()
{
CBenchBuffer buffer;
const UInt32 kBufferSize0 = (1 << 8);
const UInt32 kBufferSize1 = (1 << 10);
const UInt32 kCheckSize = (1 << 5);
if (!buffer.Alloc(kBufferSize0 + kBufferSize1))
return false;
Byte *buf = buffer.Buffer;
UInt32 i;
for (i = 0; i < kBufferSize0; i++)
buf[i] = (Byte)i;
UInt32 crc1 = CrcCalc1(buf, kBufferSize0);
if (crc1 != 0x29058C73)
return false;
CBaseRandomGenerator RG;
RandGen(buf + kBufferSize0, kBufferSize1, RG);
for (i = 0; i < kBufferSize0 + kBufferSize1 - kCheckSize; i++)
for (UInt32 j = 0; j < kCheckSize; j++)
if (CrcCalc1(buf + i, j) != CrcCalc(buf + i, j))
return false;
return true;
}
struct CBenchMethod
{
unsigned DictBits;
UInt32 EncComplex;
UInt32 DecComplexCompr;
UInt32 DecComplexUnc;
const char *Name;
};
static const CBenchMethod g_Bench[] =
{
{ 17, 357, 145, 20, "LZMA:x1" },
{ 24, 1220, 145, 20, "LZMA:x5:mt1" },
{ 24, 1220, 145, 20, "LZMA:x5:mt2" },
{ 16, 124, 40, 14, "Deflate:x1" },
{ 16, 376, 40, 14, "Deflate:x5" },
{ 16, 1082, 40, 14, "Deflate:x7" },
{ 17, 422, 40, 14, "Deflate64:x5" },
{ 15, 590, 69, 69, "BZip2:x1" },
{ 19, 815, 122, 122, "BZip2:x5" },
{ 19, 815, 122, 122, "BZip2:x5:mt2" },
{ 19, 2530, 122, 122, "BZip2:x7" },
{ 18, 1010, 0, 1150, "PPMD:x1" },
{ 22, 1655, 0, 1830, "PPMD:x5" },
{ 0, 6, 0, 6, "Delta:4" },
{ 0, 4, 0, 4, "BCJ" },
{ 0, 24, 0, 24, "AES256CBC:1" },
{ 0, 8, 0, 2, "AES256CBC:2" }
};
struct CBenchHash
{
UInt32 Complex;
UInt32 CheckSum;
const char *Name;
};
static const CBenchHash g_Hash[] =
{
{ 558, 0x8F8FEDAB, "CRC32:4" },
{ 339, 0x8F8FEDAB, "CRC32:8" },
{ 512, 0xDF1C17CC, "CRC64" },
{ 11900, 0x2D79FF2E, "SHA256" },
{ 5230, 0x4C25132B, "SHA1" }
};
struct CTotalBenchRes
{
UInt64 NumIterations;
UInt64 Rating;
UInt64 Usage;
UInt64 RPU;
void Init() { NumIterations = 0; Rating = 0; Usage = 0; RPU = 0; }
void SetSum(const CTotalBenchRes &r1, const CTotalBenchRes &r2)
{
Rating = (r1.Rating + r2.Rating);
Usage = (r1.Usage + r2.Usage);
RPU = (r1.RPU + r2.RPU);
NumIterations = (r1.NumIterations + r2.NumIterations);
}
};
static void PrintNumber(IBenchPrintCallback &f, UInt64 value, int size)
{
char s[128];
int startPos = (int)sizeof(s) - 32;
memset(s, ' ', startPos);
ConvertUInt64ToString(value, s + startPos);
// if (withSpace)
{
startPos--;
size++;
}
int len = (int)strlen(s + startPos);
if (size > len)
{
startPos -= (size - len);
if (startPos < 0)
startPos = 0;
}
f.Print(s + startPos);
}
static const int kFieldSize_Name = 12;
static const int kFieldSize_SmallName = 4;
static const int kFieldSize_Speed = 9;
static const int kFieldSize_Usage = 5;
static const int kFieldSize_RU = 6;
static const int kFieldSize_Rating = 6;
static const int kFieldSize_EU = 5;
static const int kFieldSize_Effec = 5;
static const int kFieldSize_TotalSize = 4 + kFieldSize_Speed + kFieldSize_Usage + kFieldSize_RU + kFieldSize_Rating;
static const int kFieldSize_EUAndEffec = 2 + kFieldSize_EU + kFieldSize_Effec;
static void PrintRating(IBenchPrintCallback &f, UInt64 rating, int size)
{
PrintNumber(f, (rating + 500000) / 1000000, size);
}
static void PrintPercents(IBenchPrintCallback &f, UInt64 val, UInt64 divider, int size)
{
PrintNumber(f, (val * 100 + divider / 2) / divider, size);
}
static void PrintChars(IBenchPrintCallback &f, char c, int size)
{
char s[256];
memset(s, (Byte)c, size);
s[size] = 0;
f.Print(s);
}
static void PrintSpaces(IBenchPrintCallback &f, int size)
{
PrintChars(f, ' ', size);
}
static void PrintResults(IBenchPrintCallback &f, UInt64 usage, UInt64 rpu, UInt64 rating, bool showFreq, UInt64 cpuFreq)
{
PrintNumber(f, (usage + 5000) / 10000, kFieldSize_Usage);
PrintRating(f, rpu, kFieldSize_RU);
PrintRating(f, rating, kFieldSize_Rating);
if (showFreq)
{
if (cpuFreq == 0)
PrintSpaces(f, kFieldSize_EUAndEffec);
else
{
UInt64 ddd = cpuFreq * usage / 100;
if (ddd == 0)
ddd = 1;
PrintPercents(f, (rating * 10000), ddd, kFieldSize_EU);
PrintPercents(f, rating, cpuFreq, kFieldSize_Effec);
}
}
}
static void PrintResults(IBenchPrintCallback *f, const CBenchInfo &info, UInt64 rating, bool showFreq, UInt64 cpuFreq, CTotalBenchRes *res)
{
UInt64 speed = info.GetSpeed(info.UnpackSize * info.NumIterations);
if (f)
{
if (speed != 0)
PrintNumber(*f, speed / 1024, kFieldSize_Speed);
else
PrintSpaces(*f, 1 + kFieldSize_Speed);
}
UInt64 usage = info.GetUsage();
UInt64 rpu = info.GetRatingPerUsage(rating);
if (f)
{
PrintResults(*f, usage, rpu, rating, showFreq, cpuFreq);
}
if (res)
{
res->NumIterations++;
res->RPU += rpu;
res->Rating += rating;
res->Usage += usage;
}
}
static void PrintTotals(IBenchPrintCallback &f, bool showFreq, UInt64 cpuFreq, const CTotalBenchRes &res)
{
PrintSpaces(f, 1 + kFieldSize_Speed);
UInt64 numIterations = res.NumIterations;
if (numIterations == 0)
numIterations = 1;
PrintResults(f, res.Usage / numIterations, res.RPU / numIterations, res.Rating / numIterations, showFreq, cpuFreq);
}
static void PrintRequirements(IBenchPrintCallback &f, const char *sizeString, UInt64 size, const char *threadsString, UInt32 numThreads)
{
f.Print("RAM ");
f.Print(sizeString);
PrintNumber(f, (size >> 20), 6);
f.Print(" MB, # ");
f.Print(threadsString);
PrintNumber(f, numThreads, 3);
f.NewLine();
}
struct CBenchCallbackToPrint: public IBenchCallback
{
CBenchProps BenchProps;
CTotalBenchRes EncodeRes;
CTotalBenchRes DecodeRes;
IBenchPrintCallback *_file;
UInt32 DictSize;
bool Use2Columns;
int NameFieldSize;
bool ShowFreq;
UInt64 CpuFreq;
CBenchCallbackToPrint(): Use2Columns(false), NameFieldSize(0), ShowFreq(false), CpuFreq(0) {}
void Init() { EncodeRes.Init(); DecodeRes.Init(); }
void Print(const char *s);
void NewLine();
HRESULT SetFreq(bool showFreq, UInt64 cpuFreq);
HRESULT SetEncodeResult(const CBenchInfo &info, bool final);
HRESULT SetDecodeResult(const CBenchInfo &info, bool final);
};
HRESULT CBenchCallbackToPrint::SetFreq(bool showFreq, UInt64 cpuFreq)
{
ShowFreq = showFreq;
CpuFreq = cpuFreq;
return S_OK;
}
HRESULT CBenchCallbackToPrint::SetEncodeResult(const CBenchInfo &info, bool final)
{
RINOK(_file->CheckBreak());
if (final)
{
UInt64 rating = BenchProps.GetCompressRating(DictSize, info.GlobalTime, info.GlobalFreq, info.UnpackSize * info.NumIterations);
PrintResults(_file, info, rating, ShowFreq, CpuFreq, &EncodeRes);
}
return S_OK;
}
static const char *kSep = " | ";
HRESULT CBenchCallbackToPrint::SetDecodeResult(const CBenchInfo &info, bool final)
{
RINOK(_file->CheckBreak());
if (final)
{
UInt64 rating = BenchProps.GetDecompressRating(info.GlobalTime, info.GlobalFreq, info.UnpackSize, info.PackSize, info.NumIterations);
if (Use2Columns)
_file->Print(kSep);
else
{
_file->NewLine();
PrintSpaces(*_file, NameFieldSize);
}
CBenchInfo info2 = info;
info2.UnpackSize *= info2.NumIterations;
info2.PackSize *= info2.NumIterations;
info2.NumIterations = 1;
PrintResults(_file, info2, rating, ShowFreq, CpuFreq, &DecodeRes);
}
return S_OK;
}
void CBenchCallbackToPrint::Print(const char *s)
{
_file->Print(s);
}
void CBenchCallbackToPrint::NewLine()
{
_file->NewLine();
}
void PrintLeft(IBenchPrintCallback &f, const char *s, unsigned size)
{
f.Print(s);
int numSpaces = size - MyStringLen(s);
if (numSpaces > 0)
PrintSpaces(f, numSpaces);
}
void PrintRight(IBenchPrintCallback &f, const char *s, unsigned size)
{
int numSpaces = size - MyStringLen(s);
if (numSpaces > 0)
PrintSpaces(f, numSpaces);
f.Print(s);
}
static HRESULT TotalBench(
DECL_EXTERNAL_CODECS_LOC_VARS
UInt64 complexInCommands,
UInt32 numThreads, bool forceUnpackSize, UInt32 unpackSize, IBenchPrintCallback *printCallback, CBenchCallbackToPrint *callback)
{
for (unsigned i = 0; i < ARRAY_SIZE(g_Bench); i++)
{
CBenchMethod bench = g_Bench[i];
PrintLeft(*callback->_file, bench.Name, kFieldSize_Name);
callback->BenchProps.DecComplexUnc = bench.DecComplexUnc;
callback->BenchProps.DecComplexCompr = bench.DecComplexCompr;
callback->BenchProps.EncComplex = bench.EncComplex;
COneMethodInfo method;
NCOM::CPropVariant propVariant;
propVariant = bench.Name;
RINOK(method.ParseMethodFromPROPVARIANT(L"", propVariant));
UInt32 unpackSize2 = unpackSize;
if (!forceUnpackSize && bench.DictBits == 0)
unpackSize2 = kFilterUnpackSize;
HRESULT res = MethodBench(
EXTERNAL_CODECS_LOC_VARS
complexInCommands,
false, numThreads, method, unpackSize2, bench.DictBits,
printCallback, callback, &callback->BenchProps);
if (res == E_NOTIMPL)
{
// callback->Print(" ---");
// we need additional empty line as line for decompression results
if (!callback->Use2Columns)
callback->NewLine();
}
else
{
RINOK(res);
}
callback->NewLine();
}
return S_OK;
}
static HRESULT FreqBench(
UInt64 complexInCommands,
UInt32 numThreads,
IBenchPrintCallback *_file,
bool showFreq,
UInt64 &cpuFreq,
UInt32 &res)
{
res = 0;
cpuFreq = 0;
UInt32 bufferSize = 1 << 20;
UInt32 complexity = kNumFreqCommands;
if (numThreads == 0)
numThreads = 1;
#ifdef _7ZIP_ST
numThreads = 1;
#endif
UInt32 bsize = (bufferSize == 0 ? 1 : bufferSize);
UInt64 numIterations = complexInCommands / complexity / bsize;
if (numIterations == 0)
numIterations = 1;
CBenchInfoCalc progressInfoSpec;
#ifndef _7ZIP_ST
CFreqThreads threads;
if (numThreads > 1)
{
threads.Items = new CFreqInfo[numThreads];
UInt32 i;
for (i = 0; i < numThreads; i++)
{
CFreqInfo &info = threads.Items[i];
info.Callback = _file;
info.CallbackRes = S_OK;
info.NumIterations = numIterations;
info.Size = bufferSize;
}
progressInfoSpec.SetStartTime();
for (i = 0; i < numThreads; i++)
{
CFreqInfo &info = threads.Items[i];
RINOK(info.Thread.Create(FreqThreadFunction, &info));
threads.NumThreads++;
}
threads.WaitAll();
for (i = 0; i < numThreads; i++)
{
RINOK(threads.Items[i].CallbackRes);
}
}
else
#endif
{
progressInfoSpec.SetStartTime();
UInt32 sum = g_BenchCpuFreqTemp;
for (UInt64 k = numIterations; k > 0; k--)
{
RINOK(_file->CheckBreak());
sum = CountCpuFreq(sum, bufferSize, g_BenchCpuFreqTemp);
}
res += sum;
}
CBenchInfo info;
progressInfoSpec.SetFinishTime(info);
info.UnpackSize = 0;
info.PackSize = 0;
info.NumIterations = 1;
if (_file)
{
{
UInt64 numCommands = (UInt64)numIterations * bufferSize * numThreads * complexity;
UInt64 rating = info.GetSpeed(numCommands);
cpuFreq = rating / numThreads;
PrintResults(_file, info, rating, showFreq, showFreq ? cpuFreq : 0, NULL);
}
RINOK(_file->CheckBreak());
}
return S_OK;
}
static HRESULT CrcBench(
DECL_EXTERNAL_CODECS_LOC_VARS
UInt64 complexInCommands,
UInt32 numThreads, UInt32 bufferSize,
UInt64 &speed,
UInt32 complexity,
const UInt32 *checkSum,
const COneMethodInfo &method,
IBenchPrintCallback *_file,
CTotalBenchRes *encodeRes,
bool showFreq, UInt64 cpuFreq)
{
if (numThreads == 0)
numThreads = 1;
#ifdef _7ZIP_ST
numThreads = 1;
#endif
UString methodName = method.MethodName;
// methodName.RemoveChar(L'-');
CMethodId hashID;
if (!FindHashMethod(
EXTERNAL_CODECS_LOC_VARS
methodName, hashID))
return E_NOTIMPL;
CBenchBuffer buffer;
size_t totalSize = (size_t)bufferSize * numThreads;
if (totalSize / numThreads != bufferSize)
return E_OUTOFMEMORY;
if (!buffer.Alloc(totalSize))
return E_OUTOFMEMORY;
Byte *buf = buffer.Buffer;
CBaseRandomGenerator RG;
UInt32 bsize = (bufferSize == 0 ? 1 : bufferSize);
UInt64 numIterations = complexInCommands * 256 / complexity / bsize;
if (numIterations == 0)
numIterations = 1;
CBenchInfoCalc progressInfoSpec;
#ifndef _7ZIP_ST
CCrcThreads threads;
if (numThreads > 1)
{
threads.Items = new CCrcInfo[numThreads];
UInt32 i;
for (i = 0; i < numThreads; i++)
{
CCrcInfo &info = threads.Items[i];
UString name;
RINOK(CreateHasher(EXTERNAL_CODECS_LOC_VARS hashID, name, info.Hasher));
if (!info.Hasher)
return E_NOTIMPL;
CMyComPtr<ICompressSetCoderProperties> scp;
info.Hasher.QueryInterface(IID_ICompressSetCoderProperties, &scp);
if (scp)
{
UInt64 reduceSize = 1;
RINOK(method.SetCoderProps(scp, &reduceSize));
}
Byte *data = buf + (size_t)bufferSize * i;
info.Callback = _file;
info.Data = data;
info.NumIterations = numIterations;
info.Size = bufferSize;
/* info.Crc = */ RandGenCrc(data, bufferSize, RG);
info.CheckSumDefined = false;
if (checkSum)
{
info.CheckSum = *checkSum;
info.CheckSumDefined = (checkSum && (i == 0));
}
}
progressInfoSpec.SetStartTime();
for (i = 0; i < numThreads; i++)
{
CCrcInfo &info = threads.Items[i];
RINOK(info.Thread.Create(CrcThreadFunction, &info));
threads.NumThreads++;
}
threads.WaitAll();
for (i = 0; i < numThreads; i++)
{
RINOK(threads.Items[i].Res);
}
}
else
#endif
{
/* UInt32 crc = */ RandGenCrc(buf, bufferSize, RG);
progressInfoSpec.SetStartTime();
CMyComPtr<IHasher> hasher;
UString name;
RINOK(CreateHasher(EXTERNAL_CODECS_LOC_VARS hashID, name, hasher));
if (!hasher)
return E_NOTIMPL;
CMyComPtr<ICompressSetCoderProperties> scp;
hasher.QueryInterface(IID_ICompressSetCoderProperties, &scp);
if (scp)
{
UInt64 reduceSize = 1;
RINOK(method.SetCoderProps(scp, &reduceSize));
}
RINOK(CrcBig(buf, bufferSize, numIterations, checkSum, hasher, _file));
}
CBenchInfo info;
progressInfoSpec.SetFinishTime(info);
UInt64 unpSize = numIterations * bufferSize;
UInt64 unpSizeThreads = unpSize * numThreads;
info.UnpackSize = unpSizeThreads;
info.PackSize = unpSizeThreads;
info.NumIterations = 1;
if (_file)
{
{
UInt64 numCommands = unpSizeThreads * complexity / 256;
UInt64 rating = info.GetSpeed(numCommands);
PrintResults(_file, info, rating, showFreq, cpuFreq, encodeRes);
}
RINOK(_file->CheckBreak());
}
speed = info.GetSpeed(unpSizeThreads);
return S_OK;
}
static HRESULT TotalBench_Hash(
DECL_EXTERNAL_CODECS_LOC_VARS
UInt64 complexInCommands,
UInt32 numThreads, UInt32 bufSize,
IBenchPrintCallback *printCallback, CBenchCallbackToPrint *callback,
CTotalBenchRes *encodeRes,
bool showFreq, UInt64 cpuFreq)
{
for (unsigned i = 0; i < ARRAY_SIZE(g_Hash); i++)
{
const CBenchHash &bench = g_Hash[i];
PrintLeft(*callback->_file, bench.Name, kFieldSize_Name);
// callback->BenchProps.DecComplexUnc = bench.DecComplexUnc;
// callback->BenchProps.DecComplexCompr = bench.DecComplexCompr;
// callback->BenchProps.EncComplex = bench.EncComplex;
COneMethodInfo method;
NCOM::CPropVariant propVariant;
propVariant = bench.Name;
RINOK(method.ParseMethodFromPROPVARIANT(L"", propVariant));
UInt64 speed;
HRESULT res = CrcBench(
EXTERNAL_CODECS_LOC_VARS
complexInCommands,
numThreads, bufSize,
speed,
bench.Complex, &bench.CheckSum, method,
printCallback, encodeRes, showFreq, cpuFreq);
if (res == E_NOTIMPL)
{
// callback->Print(" ---");
}
else
{
RINOK(res);
}
callback->NewLine();
}
return S_OK;
}
struct CTempValues
{
UInt64 *Values;
CTempValues(UInt32 num) { Values = new UInt64[num]; }
~CTempValues() { delete []Values; }
};
static void ParseNumberString(const UString &s, NCOM::CPropVariant &prop)
{
const wchar_t *end;
UInt64 result = ConvertStringToUInt64(s, &end);
if (*end != 0 || s.IsEmpty())
prop = s;
else if (result <= (UInt32)0xFFFFFFFF)
prop = (UInt32)result;
else
prop = result;
}
static UInt32 GetNumThreadsNext(unsigned i, UInt32 numThreads)
{
if (i < 2)
return i + 1;
i -= 1;
UInt32 num = (UInt32)(2 + (i & 1)) << (i >> 1);
return (num <= numThreads) ? num : numThreads;
}
static bool AreSameMethodNames(const char *fullName, const wchar_t *shortName)
{
for (;;)
{
wchar_t c2 = *shortName++;
if (c2 == 0)
return true;
char c1 = *fullName++;
if ((unsigned char)MyCharLower_Ascii(c1) != MyCharLower_Ascii(c2))
return false;
}
}
HRESULT Bench(
DECL_EXTERNAL_CODECS_LOC_VARS
IBenchPrintCallback *printCallback,
IBenchCallback *benchCallback,
const CObjectVector<CProperty> &props,
UInt32 numIterations,
bool multiDict)
{
if (!CrcInternalTest())
return S_FALSE;
UInt32 numCPUs = 1;
UInt64 ramSize = (UInt64)512 << 20;
#ifndef _7ZIP_ST
numCPUs = NSystem::GetNumberOfProcessors();
#endif
#if !defined(_7ZIP_ST) || defined(_WIN32)
ramSize = NSystem::GetRamSize();
#endif
UInt32 numThreads = numCPUs;
UInt32 testTime = kComplexInSeconds;
COneMethodInfo method;
unsigned i;
for (i = 0; i < props.Size(); i++)
{
const CProperty &property = props[i];
NCOM::CPropVariant propVariant;
UString name = property.Name;
name.MakeLower_Ascii();
if (!property.Value.IsEmpty())
ParseNumberString(property.Value, propVariant);
if (name.IsEqualTo("testtime"))
{
RINOK(ParsePropToUInt32(L"", propVariant, testTime));
continue;
}
if (name.IsPrefixedBy(L"mt"))
{
#ifndef _7ZIP_ST
RINOK(ParseMtProp(name.Ptr(2), propVariant, numCPUs, numThreads));
#endif
continue;
}
RINOK(method.ParseMethodFromPROPVARIANT(name, propVariant));
}
if (printCallback)
{
printCallback->Print("CPU Freq:");
}
UInt64 complexInCommands = kComplexInCommands;
if (printCallback)
{
UInt64 numMilCommands = (1 << 6);
for (int jj = 0;; jj++)
{
UInt64 start = ::GetTimeCount();
UInt32 sum = (UInt32)start;
sum = CountCpuFreq(sum, (UInt32)(numMilCommands * 1000000 / kNumFreqCommands), g_BenchCpuFreqTemp);
start = ::GetTimeCount() - start;
if (start == 0)
start = 1;
UInt64 freq = GetFreq();
UInt64 mipsVal = numMilCommands * freq / start;
if (printCallback)
PrintNumber(*printCallback, mipsVal, 5 + ((sum >> 31) & 1));
if (jj >= 3)
{
SetComplexCommands(testTime, mipsVal * 1000000, complexInCommands);
if (jj >= 8 || start >= freq)
break;
// break; // change it
numMilCommands <<= 1;
}
}
}
if (printCallback)
{
printCallback->NewLine();
printCallback->NewLine();
PrintRequirements(*printCallback, "size: ", ramSize, "CPU hardware threads:", numCPUs);
}
if (numThreads < 1 || numThreads > kNumThreadsMax)
return E_INVALIDARG;
UInt32 dict;
bool dictIsDefined = method.Get_DicSize(dict);
if (method.MethodName.IsEmpty())
method.MethodName = L"LZMA";
if (benchCallback)
{
CBenchProps benchProps;
benchProps.SetLzmaCompexity();
UInt32 dictSize = method.Get_Lzma_DicSize();
UInt32 uncompressedDataSize = kAdditionalSize + dictSize;
return MethodBench(
EXTERNAL_CODECS_LOC_VARS
complexInCommands,
true, numThreads,
method, uncompressedDataSize,
kOldLzmaDictBits, printCallback, benchCallback, &benchProps);
}
UString methodName = method.MethodName;
if (methodName.IsEqualToNoCase(L"CRC"))
methodName = L"crc32";
method.MethodName = methodName;
CMethodId hashID;
if (FindHashMethod(EXTERNAL_CODECS_LOC_VARS methodName, hashID))
{
if (!printCallback)
return S_FALSE;
IBenchPrintCallback &f = *printCallback;
if (!dictIsDefined)
dict = (1 << 24);
// methhodName.RemoveChar(L'-');
UInt32 complexity = 10000;
const UInt32 *checkSum = NULL;
{
for (unsigned i = 0; i < ARRAY_SIZE(g_Hash); i++)
{
const CBenchHash &h = g_Hash[i];
if (AreSameMethodNames(h.Name, methodName))
{
complexity = h.Complex;
checkSum = &h.CheckSum;
if (strcmp(h.Name, "CRC32:4") != 0)
break;
}
}
}
f.NewLine();
f.Print("Size");
const int kFieldSize_CrcSpeed = 6;
unsigned numThreadsTests = 0;
for (;;)
{
UInt32 t = GetNumThreadsNext(numThreadsTests, numThreads);
PrintNumber(f, t, kFieldSize_CrcSpeed);
numThreadsTests++;
if (t >= numThreads)
break;
}
f.NewLine();
f.NewLine();
CTempValues speedTotals(numThreadsTests);
{
for (unsigned ti = 0; ti < numThreadsTests; ti++)
speedTotals.Values[ti] = 0;
}
UInt64 numSteps = 0;
for (UInt32 i = 0; i < numIterations; i++)
{
for (unsigned pow = 10; pow < 32; pow++)
{
UInt32 bufSize = (UInt32)1 << pow;
if (bufSize > dict)
break;
char s[16];
ConvertUInt32ToString(pow, s);
int pos = MyStringLen(s);
s[pos++] = ':';
s[pos++] = ' ';
s[pos] = 0;
f.Print(s);
for (unsigned ti = 0; ti < numThreadsTests; ti++)
{
RINOK(f.CheckBreak());
UInt32 t = GetNumThreadsNext(ti, numThreads);
UInt64 speed = 0;
RINOK(CrcBench(EXTERNAL_CODECS_LOC_VARS complexInCommands,
t, bufSize, speed, complexity,
(pow == kNumHashDictBits) ? checkSum : NULL, method, NULL, NULL, false, 0));
PrintNumber(f, (speed >> 20), kFieldSize_CrcSpeed);
speedTotals.Values[ti] += speed;
}
f.NewLine();
numSteps++;
}
}
if (numSteps != 0)
{
f.NewLine();
f.Print("Avg:");
for (unsigned ti = 0; ti < numThreadsTests; ti++)
{
PrintNumber(f, ((speedTotals.Values[ti] / numSteps) >> 20), kFieldSize_CrcSpeed);
}
f.NewLine();
}
return S_OK;
}
bool use2Columns = false;
CBenchCallbackToPrint callback;
callback.Init();
callback._file = printCallback;
if (!dictIsDefined)
{
int dicSizeLog;
for (dicSizeLog = 25; dicSizeLog > kBenchMinDicLogSize; dicSizeLog--)
if (GetBenchMemoryUsage(numThreads, ((UInt32)1 << dicSizeLog)) + (8 << 20) <= ramSize)
break;
dict = (1 << dicSizeLog);
}
IBenchPrintCallback &f = *printCallback;
PrintRequirements(f, "usage:", GetBenchMemoryUsage(numThreads, dict), "Benchmark threads: ", numThreads);
bool totalBenchMode = (method.MethodName == L"*");
f.NewLine();
if (totalBenchMode)
{
callback.NameFieldSize = kFieldSize_Name;
use2Columns = false;
}
else
{
callback.NameFieldSize = kFieldSize_SmallName;
use2Columns = true;
}
callback.Use2Columns = use2Columns;
bool showFreq = false;
UInt64 cpuFreq = 0;
if (totalBenchMode)
{
showFreq = true;
}
int fileldSize = kFieldSize_TotalSize;
if (showFreq)
fileldSize += kFieldSize_EUAndEffec;
if (use2Columns)
{
PrintSpaces(f, callback.NameFieldSize);
PrintRight(f, "Compressing", fileldSize);
f.Print(kSep);
PrintRight(f, "Decompressing", fileldSize);
}
f.NewLine();
PrintLeft(f, totalBenchMode ? "Method" : "Dict", callback.NameFieldSize);
int j;
for (j = 0; j < 2; j++)
{
PrintRight(f, "Speed", kFieldSize_Speed + 1);
PrintRight(f, "Usage", kFieldSize_Usage + 1);
PrintRight(f, "R/U", kFieldSize_RU + 1);
PrintRight(f, "Rating", kFieldSize_Rating + 1);
if (showFreq)
{
PrintRight(f, "E/U", kFieldSize_EU + 1);
PrintRight(f, "Effec", kFieldSize_Effec + 1);
}
if (!use2Columns)
break;
if (j == 0)
f.Print(kSep);
}
f.NewLine();
PrintSpaces(f, callback.NameFieldSize);
for (j = 0; j < 2; j++)
{
PrintRight(f, "KB/s", kFieldSize_Speed + 1);
PrintRight(f, "%", kFieldSize_Usage + 1);
PrintRight(f, "MIPS", kFieldSize_RU + 1);
PrintRight(f, "MIPS", kFieldSize_Rating + 1);
if (showFreq)
{
PrintRight(f, "%", kFieldSize_EU + 1);
PrintRight(f, "%", kFieldSize_Effec + 1);
}
if (!use2Columns)
break;
if (j == 0)
f.Print(kSep);
}
f.NewLine();
f.NewLine();
if (totalBenchMode)
{
if (!dictIsDefined)
dict =
#ifdef UNDER_CE
(UInt64)1 << 20;
#else
(UInt64)1 << 24;
#endif
for (UInt32 i = 0; i < numIterations; i++)
{
if (i != 0)
printCallback->NewLine();
HRESULT res;
int freqTest;
const int kNumCpuTests = 3;
for (freqTest = 0; freqTest < kNumCpuTests; freqTest++)
{
PrintLeft(f, "CPU", kFieldSize_Name);
UInt32 resVal;
RINOK(FreqBench(complexInCommands, numThreads, printCallback, freqTest == kNumCpuTests - 1, cpuFreq, resVal));
callback.NewLine();
if (freqTest == kNumCpuTests - 1)
SetComplexCommands(testTime, cpuFreq, complexInCommands);
}
callback.NewLine();
callback.SetFreq(true, cpuFreq);
res = TotalBench(EXTERNAL_CODECS_LOC_VARS complexInCommands, numThreads, dictIsDefined, dict, printCallback, &callback);
RINOK(res);
res = TotalBench_Hash(EXTERNAL_CODECS_LOC_VARS complexInCommands, numThreads,
1 << kNumHashDictBits, printCallback, &callback, &callback.EncodeRes, true, cpuFreq);
RINOK(res);
callback.NewLine();
{
PrintLeft(f, "CPU", kFieldSize_Name);
UInt32 resVal;
UInt64 cpuFreqLastTemp = cpuFreq;
RINOK(FreqBench(complexInCommands, numThreads, printCallback, false, cpuFreqLastTemp, resVal));
callback.NewLine();
}